﻿<?xml version="1.0" encoding="UTF-8"?><rss xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:atom="http://www.w3.org/2005/Atom" version="2.0" xmlns:itunes="http://www.itunes.com/dtds/podcast-1.0.dtd" xmlns:googleplay="http://www.google.com/schemas/play-podcasts/1.0"><channel><title><![CDATA[Aaron Tay's Musings about Librarianship]]></title><description><![CDATA[Aaron Tay's thoughts about academic librarianship ]]></description><link>https://aarontay.substack.com</link><image><url>https://substackcdn.com/image/fetch/$s_!SIBS!,w_256,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdabe20d0-c305-4694-b04d-13176319efee_440x440.png</url><title>Aaron Tay&apos;s Musings about Librarianship</title><link>https://aarontay.substack.com</link></image><generator>Substack</generator><lastBuildDate>Mon, 15 Jun 2026 09:38:50 GMT</lastBuildDate><atom:link href="https://aarontay.substack.com/feed" rel="self" type="application/rss+xml"/><copyright><![CDATA[Aaron Tay]]></copyright><language><![CDATA[en]]></language><webMaster><![CDATA[aarontay@substack.com]]></webMaster><itunes:owner><itunes:email><![CDATA[aarontay@substack.com]]></itunes:email><itunes:name><![CDATA[Aaron Tay]]></itunes:name></itunes:owner><itunes:author><![CDATA[Aaron Tay]]></itunes:author><googleplay:owner><![CDATA[aarontay@substack.com]]></googleplay:owner><googleplay:email><![CDATA[aarontay@substack.com]]></googleplay:email><googleplay:author><![CDATA[Aaron Tay]]></googleplay:author><itunes:block><![CDATA[Yes]]></itunes:block><item><title><![CDATA[What a year of testing & thinking about AI academic search taught me]]></title><description><![CDATA[The Chatbot Is the Wrong Mental Model]]></description><link>https://aarontay.substack.com/p/what-a-year-of-testing-and-thinking</link><guid 
isPermaLink="false">https://aarontay.substack.com/p/what-a-year-of-testing-and-thinking</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Mon, 08 Jun 2026 01:51:26 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!Puaf!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc9e2f2f7-9d20-4722-9eed-ffc22e7cba82_1672x941.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Puaf!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc9e2f2f7-9d20-4722-9eed-ffc22e7cba82_1672x941.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Puaf!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc9e2f2f7-9d20-4722-9eed-ffc22e7cba82_1672x941.png 424w, https://substackcdn.com/image/fetch/$s_!Puaf!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc9e2f2f7-9d20-4722-9eed-ffc22e7cba82_1672x941.png 848w, https://substackcdn.com/image/fetch/$s_!Puaf!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc9e2f2f7-9d20-4722-9eed-ffc22e7cba82_1672x941.png 1272w, https://substackcdn.com/image/fetch/$s_!Puaf!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc9e2f2f7-9d20-4722-9eed-ffc22e7cba82_1672x941.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!Puaf!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc9e2f2f7-9d20-4722-9eed-ffc22e7cba82_1672x941.png" width="1456" height="819" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c9e2f2f7-9d20-4722-9eed-ffc22e7cba82_1672x941.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:819,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:2155948,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/200973726?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc9e2f2f7-9d20-4722-9eed-ffc22e7cba82_1672x941.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Puaf!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc9e2f2f7-9d20-4722-9eed-ffc22e7cba82_1672x941.png 424w, https://substackcdn.com/image/fetch/$s_!Puaf!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc9e2f2f7-9d20-4722-9eed-ffc22e7cba82_1672x941.png 848w, https://substackcdn.com/image/fetch/$s_!Puaf!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc9e2f2f7-9d20-4722-9eed-ffc22e7cba82_1672x941.png 1272w, https://substackcdn.com/image/fetch/$s_!Puaf!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc9e2f2f7-9d20-4722-9eed-ffc22e7cba82_1672x941.png 1456w" 
sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><em>A look back at the ideas that stuck, the ones I am still unsure about, and where I think this is heading.</em></p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee via ko-fi!&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee via ko-fi!</span></a></p><p>About a year ago I shifted my main writing home <a href="https://musingsaboutlibrarianship.blogspot.com/">from blogger</a> 
to Substack. Since then, this newsletter has grown from roughly 3,000 email subscribers to around 5,500. While the affordances of Substack have made it easier for subscribers to follow, the fact that a niche newsletter about academic search and library technology could add 2,500 readers in a year is mostly a signal about the moment we are in. Librarians, researchers, and tool builders are all unsettled by what &#8220;AI search&#8221; is doing to academic discovery. </p><p>I think there are not many places pondering in the open about what this means, trying to work it out rather than deciding they have already figured out that &#8220;AI&#8221; applied to search (or anything really) is bad. </p><p>If this newsletter has a job, that is the job. Thank you for reading, for arguing in the comments, and for forwarding posts to colleagues who hopefully subscribe.</p><p>If a year of this has taught me one thing, it is that the freeform chatbot is the wrong mental model for academic search. The fear that dominates most discussion, that these systems fabricate sources and invent findings, is real for a naked language model answering from memory or even one with a weak, naive RAG implementation. </p><p>But wrap a model in an agentic harness that runs deterministic checks in code, and force it to verify every claim against an independent source rather than generate it freely, and most of that risk is manageable (at least for claims that can be checked against independent sources). 
I was not sure of this twelve months ago, or at least I could not have said it cleanly without experience trying LLMs with agentic harnesses.</p><p>This post provides a thematic retrospective of the content on my blog and ends with a preview of upcoming content.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><h2>One question, many posts</h2><p>There is a narrower question every post here is also trying to answer: when a vendor says &#8220;AI-powered search&#8221;, what is being claimed, and how should a librarian evaluate it without either hype or unthinking rejection?</p><p>That span of 12 months opened with a two-part article <a href="https://aarontay.substack.com/p/how-should-academic-retrieval-augmented">testing how RAG systems handle retracted papers across Elicit, Scite, SciSpace, Primo Research Assistant, Undermind and others</a>, and it closes with sharper &#8220;hot takes&#8221; about where librarianship is misreading the whole category. 
The through-line is the same: take the tools seriously enough to test them properly, and take our own assumptions seriously enough to question them.</p><h2>Defining the thing before arguing about it</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!6j-9!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23732e4b-bed1-4666-bd96-f6016de0e045_1491x1055.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!6j-9!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23732e4b-bed1-4666-bd96-f6016de0e045_1491x1055.png 424w, https://substackcdn.com/image/fetch/$s_!6j-9!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23732e4b-bed1-4666-bd96-f6016de0e045_1491x1055.png 848w, https://substackcdn.com/image/fetch/$s_!6j-9!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23732e4b-bed1-4666-bd96-f6016de0e045_1491x1055.png 1272w, https://substackcdn.com/image/fetch/$s_!6j-9!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23732e4b-bed1-4666-bd96-f6016de0e045_1491x1055.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!6j-9!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23732e4b-bed1-4666-bd96-f6016de0e045_1491x1055.png" width="1456" height="1030" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/23732e4b-bed1-4666-bd96-f6016de0e045_1491x1055.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1030,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1761470,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/200973726?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23732e4b-bed1-4666-bd96-f6016de0e045_1491x1055.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!6j-9!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23732e4b-bed1-4666-bd96-f6016de0e045_1491x1055.png 424w, https://substackcdn.com/image/fetch/$s_!6j-9!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23732e4b-bed1-4666-bd96-f6016de0e045_1491x1055.png 848w, https://substackcdn.com/image/fetch/$s_!6j-9!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23732e4b-bed1-4666-bd96-f6016de0e045_1491x1055.png 1272w, https://substackcdn.com/image/fetch/$s_!6j-9!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23732e4b-bed1-4666-bd96-f6016de0e045_1491x1055.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The post I point newcomers to first is <strong><a href="https://aarontay.substack.com/p/what-do-we-actually-mean-by-ai-powered">What Do We Actually Mean by &#8220;AI-Powered Search&#8221;?</a></strong>. The phrase hides at least four different things: post-retrieval conveniences like summarisation that do not touch your results at all; semantic retrieval using vector embedding that goes beyond lexical matching; LLMs used in retrieval and ranking; and full synthesis and generation across papers. Your concern about one of those may not apply to another, and most of the unproductive arguments I see come from people defending or attacking different levels while using the same words.</p><p>The framework of mine that has resonated the most, though, is a bit older. 
<strong><a href="https://aarontay.substack.com/p/why-i-think-academic-deep-research">Why I Think Academic Deep Research &#8212; or at Least Deep Search &#8212; Will &#8220;Win&#8221;</a></strong> is where my 2x2 matrix first appeared, and it has since been picked up and cited well beyond this newsletter. </p><p>It sorts search systems along two axes. The first is how the system works: a quick, one-shot retrieval, or a deep, iterative process that evaluates many candidates. The second is what it returns: Search, which only retrieves and ranks documents, or RAG, which extracts from them to generate an answer with citations. That gives four quadrants, Quick Search, Quick RAG, Deep Search and Deep RAG, and most of the products people argue about sit cleanly in one of them. </p><p>The post argues that the deep quadrants are where the future of academic search is heading and <a href="https://aarontay.substack.com/p/what-academic-deep-research-is-really">why Deep Research is mostly meant for helping to orientate yourself</a>. Whatever you make of that call, the 2x2 itself has been the durable contribution.</p><p>If you are wondering what vector embeddings are, a natural companion piece is <strong><a href="https://aarontay.substack.com/p/why-embedding-vector-search-is-probably">Why Embedding Vector Search Is Probably One of the Least Objectionable Use of AI for Search</a></strong>.  Embedding-based semantic search dodges many, though not all, of the criticisms aimed at ChatGPT-style generative AI. It does not fabricate text or invent citations the way generation can; it only changes how documents are matched and ranked. 
Map it onto the four levels above and it sits well below full synthesis on the risk gradient, which is worth remembering before treating every form of &#8220;AI search&#8221; as equally suspect.</p><p>The move to vector embedding is not without direct consequences, and it is the subject of <strong><a href="https://aarontay.substack.com/p/the-case-of-the-vanishing-hit-count">The Case of the Vanishing Hit Count</a></strong>, written up based on a question from my FSCI 2025 workshop. Once you leave Boolean behind for embedding and other AI-driven retrieval, the exact, countable hit set disappears, replaced by the top-k of semantic search or even the evaluated results of deep search, until even the familiar question of how many results you got no longer has a stable answer.</p><p>As I tested and used these new, modern &#8220;AI search&#8221; tools, I noticed a UX issue which I initially called <strong><a href="https://aarontay.substack.com/p/the-blank-box-problem-why-its-harder">The Blank Box Problem</a></strong>. We spent two decades complaining that users would not learn Boolean operators and field codes. We have now replaced all of that with a single blinking cursor in an empty box, and users are more confused than ever, caught between not knowing how to speak to the machine (keyword, natural language, or elaborate prompt) and not knowing what the machine can even do with their words. Trading visible constraints for infinite potential turns out to be a usability crisis, not a usability win.</p><p>Finally, I attempted to <a href="https://aarontay.substack.com/p/classifying-the-ways-llms-summarise">classify the ways LLMs summarise</a> in tools like EBSCO and ProQuest. I distinguish between fixed single-document summaries, query-dependent single-document answers, document-by-document synthesis tables, and full multi-document RAG synthesis. 
The classification shows that &#8220;AI summaries&#8221; are not one thing: as tools move from pre-canned article summaries to query-driven synthesis across many papers, usefulness rises, but so do unpredictability, evaluation difficulty, and trust risks.</p><h2>Deflating the hype, without dismissing the tools</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!WCs6!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ddbc852-0b1f-477f-80c4-7a01544e45d6_1448x1086.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!WCs6!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ddbc852-0b1f-477f-80c4-7a01544e45d6_1448x1086.png 424w, https://substackcdn.com/image/fetch/$s_!WCs6!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ddbc852-0b1f-477f-80c4-7a01544e45d6_1448x1086.png 848w, https://substackcdn.com/image/fetch/$s_!WCs6!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ddbc852-0b1f-477f-80c4-7a01544e45d6_1448x1086.png 1272w, https://substackcdn.com/image/fetch/$s_!WCs6!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ddbc852-0b1f-477f-80c4-7a01544e45d6_1448x1086.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!WCs6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ddbc852-0b1f-477f-80c4-7a01544e45d6_1448x1086.png" width="1448" height="1086" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/8ddbc852-0b1f-477f-80c4-7a01544e45d6_1448x1086.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1086,&quot;width&quot;:1448,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1920026,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/200973726?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ddbc852-0b1f-477f-80c4-7a01544e45d6_1448x1086.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!WCs6!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ddbc852-0b1f-477f-80c4-7a01544e45d6_1448x1086.png 424w, https://substackcdn.com/image/fetch/$s_!WCs6!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ddbc852-0b1f-477f-80c4-7a01544e45d6_1448x1086.png 848w, https://substackcdn.com/image/fetch/$s_!WCs6!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ddbc852-0b1f-477f-80c4-7a01544e45d6_1448x1086.png 1272w, https://substackcdn.com/image/fetch/$s_!WCs6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8ddbc852-0b1f-477f-80c4-7a01544e45d6_1448x1086.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>While I am known to be &#8220;pro-AI&#8221;, particularly for search, I have pushed back on many over-claims and warned about the issues this new technology brings.</p><p><strong><a href="https://aarontay.substack.com/p/the-ai-powered-library-search-that">The AI-Powered Library Search That Refused to Search</a></strong> is probably one of the most read posts on my Substack so far, perhaps because critical posts about AI travel further than careful ones.<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-1" href="#footnote-1" target="_self">1</a></p><p>It documents an odd new problem: content-moderation layers designed for chatbots are creeping into library discovery and quietly refusing to search certain controversial topics at all. 
How serious this is, I am not yet sure.</p><p><strong><a href="https://aarontay.substack.com/p/the-horseless-carriage-of-ai-search">The Horseless Carriage of AI Search</a></strong> takes aim at an increasingly common pattern in legacy databases, the claim that they now &#8220;do AI&#8221;. It argues that bolting an LLM onto the front of a database, such as Primo Research Assistant, to generate Boolean strings is mostly of little benefit. I am not saying Boolean must die, but I am saying that dressing up the old engine is not the breakthrough it is sold as. I have since had to qualify this argument, and I come back to exactly where it breaks near the end.</p><p><strong><a href="https://aarontay.substack.com/p/how-agentic-are-academic-deep-research">Deep Research, Shallow Agency</a></strong> takes aim at the word agentic. Most academic deep research tools at the time, such as Asta Paper Finder, Undermind Classic and Scholar Labs, run fixed internal workflows, and they stumble the moment you hand them a literature review task that does not fit what they were built to solve. The agency is largely an illusion.</p><p>The follow-up, <strong><a href="https://aarontay.substack.com/p/from-fixed-search-workflows-to-agentic">From Fixed Search Workflows to Agentic Academic Search: Promise, Progress, and the Invisible Menu Problem</a></strong>, looks at what happens as tools start handing control back to users. Undermind&#8217;s Projects feature is the worked example: it lets you steer and manage the agent rather than accept a fixed pipeline, which is real progress. But it also exposes what I call the Invisible Menu Problem. When you are managing an agent, you cannot see the full menu of what it can do, so you are left guessing at its capabilities and limits. 
It echoes the Blank Box Problem one level up, with the opacity shifted from the query to the agent itself.</p><p>In <a href="https://aarontay.substack.com/p/are-ai-tools-killing-review-articles">Are AI Tools Killing Review Articles? Two Failure Modes Suggest Otherwise</a>, I argued that the most important kinds of review articles are still hard for AI, for two reasons: the corpus construction gap, where tools still struggle with retrieval and exhaustiveness, and the conceptualisation gap, where expert judgement is needed before retrieval even begins.</p><h2>The uncomfortable mirror for librarians</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!4RRc!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb0f20e9-98d4-44cb-a431-a2b9c0b6b7e8_1055x1491.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!4RRc!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb0f20e9-98d4-44cb-a431-a2b9c0b6b7e8_1055x1491.png 424w, https://substackcdn.com/image/fetch/$s_!4RRc!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb0f20e9-98d4-44cb-a431-a2b9c0b6b7e8_1055x1491.png 848w, https://substackcdn.com/image/fetch/$s_!4RRc!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb0f20e9-98d4-44cb-a431-a2b9c0b6b7e8_1055x1491.png 1272w, https://substackcdn.com/image/fetch/$s_!4RRc!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb0f20e9-98d4-44cb-a431-a2b9c0b6b7e8_1055x1491.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!4RRc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb0f20e9-98d4-44cb-a431-a2b9c0b6b7e8_1055x1491.png" width="1055" height="1491" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/db0f20e9-98d4-44cb-a431-a2b9c0b6b7e8_1055x1491.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1491,&quot;width&quot;:1055,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1772888,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/200973726?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb0f20e9-98d4-44cb-a431-a2b9c0b6b7e8_1055x1491.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!4RRc!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb0f20e9-98d4-44cb-a431-a2b9c0b6b7e8_1055x1491.png 424w, https://substackcdn.com/image/fetch/$s_!4RRc!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb0f20e9-98d4-44cb-a431-a2b9c0b6b7e8_1055x1491.png 848w, https://substackcdn.com/image/fetch/$s_!4RRc!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb0f20e9-98d4-44cb-a431-a2b9c0b6b7e8_1055x1491.png 1272w, https://substackcdn.com/image/fetch/$s_!4RRc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb0f20e9-98d4-44cb-a431-a2b9c0b6b7e8_1055x1491.png 
1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>A few posts are aimed squarely at us librarians. </p><p><strong><a href="https://aarontay.substack.com/p/were-good-at-search-just-not-the">&#8220;We&#8217;re Good at Search,&#8221; Just Not the Kind the AI Era Demands</a></strong> is a deliberate provocation. When I look at the evaluation rubrics for AI search now circulating, relevancy is often just one subjective category among many, scored on an &#8220;I know it when I see it&#8221; basis. For a profession that prides itself on search, that is a strange place to be. 
</p><p><strong><a href="https://aarontay.substack.com/p/ai-academic-search-and-the-missing">AI Academic Search and the Missing Middle of Literature Discovery</a></strong> makes a related point: I argue that by judging these tools mainly through undergraduate information literacy and through evidence synthesis, we underrate their strongest current use case, the ordinary narrative literature review, perhaps because we are less involved in it.</p><p>My most recent post, <strong><a href="https://aarontay.substack.com/p/hot-take-stop-calling-poor-search">Stop Calling Poor Search Rankings Necessary Friction for Learning</a></strong>, takes aim at a comfortable rationalisation. When a system ranks badly, it is tempting to argue that the struggle is good for students, that wading through irrelevant results teaches them something. There is a legitimate version of that idea, where we set out to expose students to adjacent and boundary literature, but that is intentional design. Defending accidental noise as if it were pedagogy is not the same thing, and we should stop confusing the two.</p><p>This connects directly to an older post, <em><a href="https://aarontay.substack.com/p/the-sycophancy-fallacy-why-you-may">The Sycophancy Fallacy</a></em>. Both are the same category error: mistaking a ranking system&#8217;s output for a stance. The worry that AI search tools will agree with users the way chatbots do treats retrieval as a conversational partner that can flatter. A retrieval system is not agreeing with you; it is returning what its ranking surfaces. Confusing the two means worrying about the wrong bias and missing the real ones.</p><p>The last is a little left field, since digital literacy is not my speciality. <a href="https://aarontay.substack.com/p/fact-checking-vs-academic-inquiry">Fact-Checking vs the Academic Inquiry Mindset</a> asks whether we are collapsing two different habits of mind into one. 
Verifying a discrete claim is not the same as open-ended scholarly inquiry, and treating the first as though it were the second risks leaving students short of what research demands.</p><p> </p><h2>The plumbing problems nobody is watching</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!wAJp!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb36b9f7-3c18-4e70-af74-286294129439_1672x941.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!wAJp!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb36b9f7-3c18-4e70-af74-286294129439_1672x941.png 424w, https://substackcdn.com/image/fetch/$s_!wAJp!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb36b9f7-3c18-4e70-af74-286294129439_1672x941.png 848w, https://substackcdn.com/image/fetch/$s_!wAJp!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb36b9f7-3c18-4e70-af74-286294129439_1672x941.png 1272w, https://substackcdn.com/image/fetch/$s_!wAJp!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb36b9f7-3c18-4e70-af74-286294129439_1672x941.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!wAJp!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb36b9f7-3c18-4e70-af74-286294129439_1672x941.png" width="1456" height="819" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/eb36b9f7-3c18-4e70-af74-286294129439_1672x941.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:819,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1721191,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/200973726?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb36b9f7-3c18-4e70-af74-286294129439_1672x941.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!wAJp!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb36b9f7-3c18-4e70-af74-286294129439_1672x941.png 424w, https://substackcdn.com/image/fetch/$s_!wAJp!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb36b9f7-3c18-4e70-af74-286294129439_1672x941.png 848w, https://substackcdn.com/image/fetch/$s_!wAJp!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb36b9f7-3c18-4e70-af74-286294129439_1672x941.png 1272w, https://substackcdn.com/image/fetch/$s_!wAJp!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb36b9f7-3c18-4e70-af74-286294129439_1672x941.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p> The least glamorous posts may matter most. <strong><a href="https://aarontay.substack.com/p/the-petrol-tank-for-ai-discovery">The Petrol Tank for AI Discovery Might Be Running Dry</a></strong> flags that the comprehensive AI search engines we are starting to lean on, such as Elicit, Consensus and Undermind, depend on access to abstracts and full text that publishers now have a strong commercial incentive to close off.</p><p><strong><a href="https://aarontay.substack.com/p/why-ghost-references-still-haunt">Why Ghost References Still Haunt Us</a></strong> makes two claims: that Google Scholar's <code>[CITATION]</code> entries and a polluted web can undermine the verification RAG depends on, and that fabricated and ghost references often predate LLMs. I remain confident about the first; I am less sure about the second, for reasons I give below.  
</p><h2>Trying to explain and understand</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!jh9e!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9392897d-6fe3-47d3-810b-c2e2a3f041f0_1672x941.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!jh9e!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9392897d-6fe3-47d3-810b-c2e2a3f041f0_1672x941.png 424w, https://substackcdn.com/image/fetch/$s_!jh9e!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9392897d-6fe3-47d3-810b-c2e2a3f041f0_1672x941.png 848w, https://substackcdn.com/image/fetch/$s_!jh9e!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9392897d-6fe3-47d3-810b-c2e2a3f041f0_1672x941.png 1272w, https://substackcdn.com/image/fetch/$s_!jh9e!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9392897d-6fe3-47d3-810b-c2e2a3f041f0_1672x941.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!jh9e!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9392897d-6fe3-47d3-810b-c2e2a3f041f0_1672x941.png" width="1456" height="819" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/9392897d-6fe3-47d3-810b-c2e2a3f041f0_1672x941.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:819,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1827516,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/200973726?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9392897d-6fe3-47d3-810b-c2e2a3f041f0_1672x941.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!jh9e!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9392897d-6fe3-47d3-810b-c2e2a3f041f0_1672x941.png 424w, https://substackcdn.com/image/fetch/$s_!jh9e!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9392897d-6fe3-47d3-810b-c2e2a3f041f0_1672x941.png 848w, https://substackcdn.com/image/fetch/$s_!jh9e!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9392897d-6fe3-47d3-810b-c2e2a3f041f0_1672x941.png 1272w, https://substackcdn.com/image/fetch/$s_!jh9e!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9392897d-6fe3-47d3-810b-c2e2a3f041f0_1672x941.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>About a year ago, whenever I heard the term agentic search (mostly in the context of Undermind), I had an uneasy sense that I did not really fully understand what it meant.</p><p>As I spent time thinking about it, trying MCP servers, skills, and finally LLMs with agentic harnesses like Claude Code and Codex, something clicked.</p><p><strong><a href="https://aarontay.substack.com/p/creating-your-own-research-assistant">The Agentic Researcher</a></strong> and the <strong><a href="https://aarontay.substack.com/p/mcp-servers-and-academic-search-the">MCP server posts</a></strong> were among my earliest posts documenting my growing understanding of what &#8220;agentic&#8221; means.</p><p>A general LLM paired with academic Model Context Protocol servers or other tools can match or beat 
specialised deep research tools. This may point to a real-time, federated model of access to publisher content rather than yet another giant centralised index.</p><h2>Reviews &amp; evaluation frameworks</h2><p>I did some hands-on reviews of <a href="https://aarontay.substack.com/p/a-2025-deep-dive-of-consensus-promises">Consensus</a>, <a href="https://aarontay.substack.com/p/scholar-labs-early-review-google">Scholar Labs</a>, <a href="https://aarontay.substack.com/p/researchrabbits-2025-revamp-iterative">ResearchRabbit</a> and <a href="https://aarontay.substack.com/p/googles-ai-mode-it-can-out-search">Google&#8217;s AI Mode</a> as they shipped.</p><p>Librarians are always interested in evaluation frameworks, so in <em><a href="https://aarontay.substack.com/p/ai-academic-search-needs-better-frameworks">AI academic search needs better frameworks for understanding and evaluation</a></em> I pointed to three librarian projects I found promising. That was followed by <em><a href="https://aarontay.substack.com/p/better-ai-search-rubrics-roles-gates">Better AI Search Rubrics: Roles, Gates, and Retrieval Tests</a></em>, an opinionated piece on the common weaknesses in such rubrics and ways to improve them.</p><p> </p><h2>Other posts of interest beyond the twelve-month window</h2><p>I did not suddenly start writing about AI search when I moved here. 
Here are a few from outside this window that I still consider significant, now cloned onto Substack from my Blogger platform:</p><ul><li><p><a href="https://aarontay.substack.com/p/the-reproducibility-and">The reproducibility and interpretability of academic Ai Search engines like Primo Research Assistant, Web of Science Research Assistant, Scopus AI and more</a></p></li><li><p><a href="https://aarontay.substack.com/p/testing-ai-academic-search-engines-1">Testing AI Academic Search Engines (1): Defining the tools</a> &amp; <strong><a href="https://aarontay.substack.com/p/testing-ai-academic-search-engines-what">Testing AI Academic Search Engines - What to find out and how to test (2)</a></strong></p></li><li><p><a href="https://aarontay.substack.com/p/comparative-review-on-primo-research">Comparative review on Primo Research Assistant, Scopus AI, Web of Science Research Assistant and an explainer for AI search for librarians</a></p></li><li><p><a href="https://aarontay.substack.com/p/when-is-hallucination-not-hallucination">When is a Hallucination Not a Hallucination? 
The Role of Implicit Knowledge in RAG</a></p></li><li><p><a href="https://aarontay.substack.com/p/the-rise-of-agent-based-deep-research">The Rise of Agent-Based Deep Research: Exploring OpenAI&#8217;s Deep Research, Gemini Deep Research, Perplexity Deep Research, Ai2 ScholarQA, STORM, and More in 2025</a></p></li><li><p><a href="https://aarontay.substack.com/p/why-use-of-new-ai-enhanced-tools-that">Why use of new AI enhanced tools that help with literature review should be discouraged for undergraduates</a></p></li><li><p><a href="https://aarontay.substack.com/p/primo-research-assistant-launches-first">Primo Research Assistant launches- a first look and some things you should know</a></p></li></ul><p></p><h2>What I am unsure about, and what comes next</h2><p>In keeping with how I try to write, the honest caveat: a lot of this is provisional, and some of it will age badly. The landscape shifts month to month, and several posts above are me thinking out loud rather than concluding. </p><p>Two examples.</p><p>The first is the <a href="https://aarontay.substack.com/p/why-ghost-references-still-haunt">ghost references post</a>. I stand by the weakness it identifies in Google Scholar, but I am no longer confident in its conclusion that, in the example I investigated, the first version of the ghost reference I traced was human-made rather than produced by an LLM. 
Treat that part as an open question rather than a finding.</p><p></p><h3>Where my &#8220;horseless carriage&#8221; critique breaks</h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!_Ts_!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5700c6d2-4486-479d-a848-581d5a4be381_1672x941.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!_Ts_!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5700c6d2-4486-479d-a848-581d5a4be381_1672x941.png 424w, https://substackcdn.com/image/fetch/$s_!_Ts_!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5700c6d2-4486-479d-a848-581d5a4be381_1672x941.png 848w, https://substackcdn.com/image/fetch/$s_!_Ts_!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5700c6d2-4486-479d-a848-581d5a4be381_1672x941.png 1272w, https://substackcdn.com/image/fetch/$s_!_Ts_!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5700c6d2-4486-479d-a848-581d5a4be381_1672x941.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!_Ts_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5700c6d2-4486-479d-a848-581d5a4be381_1672x941.png" width="1456" height="819" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/5700c6d2-4486-479d-a848-581d5a4be381_1672x941.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:819,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1645963,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/200973726?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5700c6d2-4486-479d-a848-581d5a4be381_1672x941.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!_Ts_!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5700c6d2-4486-479d-a848-581d5a4be381_1672x941.png 424w, https://substackcdn.com/image/fetch/$s_!_Ts_!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5700c6d2-4486-479d-a848-581d5a4be381_1672x941.png 848w, https://substackcdn.com/image/fetch/$s_!_Ts_!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5700c6d2-4486-479d-a848-581d5a4be381_1672x941.png 1272w, https://substackcdn.com/image/fetch/$s_!_Ts_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5700c6d2-4486-479d-a848-581d5a4be381_1672x941.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The second I have to own more directly. I was proud of <em><a href="https://aarontay.substack.com/p/the-horseless-carriage-of-ai-search">The Horseless Carriage of AI Search</a></em>, my critique of legacy vendors taking the easy route to &#8220;implement AI&#8221; by using an LLM only to generate Boolean. </p><p>After using Primo&#8217;s MCP server I have had to qualify it. </p><p>The critique was aimed at one specific move: using an LLM as a translation layer that feeds Boolean into the same lexical engine over the same document corpus. I still think that is mostly low-value. </p><p>What I missed is that database and dataset selection is a different task from normal article search. </p><p>There the target is a small, description-only space, and the model earns its keep two ways. 
It normalises vocabulary, and it draws on pretraining knowledge to go straight to the right resource. That is not dressing up the old engine. It is doing something the old engine could not. The critique holds for article retrieval and does not generalise to query-to-resource matching.</p><p>A concrete example helps clarify. </p><p>Experienced librarians know that users struggle to find the right database for datasets, because their query terms have to match a very small target space, the database description. A wrong term returns zero hits: <a href="https://search.library.smu.edu.sg/discovery/search?query=any,contains,cost%20of%20living&amp;tab=Catalogue&amp;vid=65SMU_INST:SMU_NUI&amp;lang=en&amp;offset=0&amp;sortby=rank&amp;facet=rtype,include,databases">search for cost of living datasets/databases rather than CPI and you find nothing</a>.  </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!S0T4!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9357228e-53b9-440b-a33c-f4a9b4cb7a3f_830x838.webp" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!S0T4!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9357228e-53b9-440b-a33c-f4a9b4cb7a3f_830x838.webp 424w, https://substackcdn.com/image/fetch/$s_!S0T4!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9357228e-53b9-440b-a33c-f4a9b4cb7a3f_830x838.webp 848w, https://substackcdn.com/image/fetch/$s_!S0T4!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9357228e-53b9-440b-a33c-f4a9b4cb7a3f_830x838.webp 1272w, 
https://substackcdn.com/image/fetch/$s_!S0T4!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9357228e-53b9-440b-a33c-f4a9b4cb7a3f_830x838.webp 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!S0T4!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9357228e-53b9-440b-a33c-f4a9b4cb7a3f_830x838.webp" width="830" height="838" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/9357228e-53b9-440b-a33c-f4a9b4cb7a3f_830x838.webp&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:838,&quot;width&quot;:830,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!S0T4!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9357228e-53b9-440b-a33c-f4a9b4cb7a3f_830x838.webp 424w, https://substackcdn.com/image/fetch/$s_!S0T4!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9357228e-53b9-440b-a33c-f4a9b4cb7a3f_830x838.webp 848w, https://substackcdn.com/image/fetch/$s_!S0T4!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9357228e-53b9-440b-a33c-f4a9b4cb7a3f_830x838.webp 1272w, 
https://substackcdn.com/image/fetch/$s_!S0T4!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9357228e-53b9-440b-a33c-f4a9b4cb7a3f_830x838.webp 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>A capable LLM sidesteps this, because it knows to search for the right terms,  <a href="https://search.library.smu.edu.sg/discovery/search?query=any%2Ccontains%2CCPI&amp;tab=Catalogue&amp;search_scope=MyInstitution&amp;vid=65SMU_INST%3ASMU_NUI&amp;lang=en&amp;offset=0&amp;sortby=rank&amp;facet=rtype%2Cinclude%2Cdatabases">CPI</a>, <a 
href="https://search.library.smu.edu.sg/discovery/search?query=any%2Ccontains%2Cinflation&amp;tab=Catalogue&amp;search_scope=MyInstitution&amp;vid=65SMU_INST%3ASMU_NUI&amp;lang=en&amp;offset=0&amp;sortby=rank&amp;facet=rtype%2Cinclude%2Cdatabases">inflation</a> , and so on.   </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!WryY!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F21dfa4cf-ebac-46bc-8982-c4e3a36af3c2_836x425.webp" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!WryY!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F21dfa4cf-ebac-46bc-8982-c4e3a36af3c2_836x425.webp 424w, https://substackcdn.com/image/fetch/$s_!WryY!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F21dfa4cf-ebac-46bc-8982-c4e3a36af3c2_836x425.webp 848w, https://substackcdn.com/image/fetch/$s_!WryY!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F21dfa4cf-ebac-46bc-8982-c4e3a36af3c2_836x425.webp 1272w, https://substackcdn.com/image/fetch/$s_!WryY!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F21dfa4cf-ebac-46bc-8982-c4e3a36af3c2_836x425.webp 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!WryY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F21dfa4cf-ebac-46bc-8982-c4e3a36af3c2_836x425.webp" width="836" height="425" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/21dfa4cf-ebac-46bc-8982-c4e3a36af3c2_836x425.webp&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:425,&quot;width&quot;:836,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!WryY!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F21dfa4cf-ebac-46bc-8982-c4e3a36af3c2_836x425.webp 424w, https://substackcdn.com/image/fetch/$s_!WryY!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F21dfa4cf-ebac-46bc-8982-c4e3a36af3c2_836x425.webp 848w, https://substackcdn.com/image/fetch/$s_!WryY!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F21dfa4cf-ebac-46bc-8982-c4e3a36af3c2_836x425.webp 1272w, https://substackcdn.com/image/fetch/$s_!WryY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F21dfa4cf-ebac-46bc-8982-c4e3a36af3c2_836x425.webp 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Claude 4.8 is similarly smart, reasoning (after searching) that most database records will not have &#8220;cost of living&#8221; in their metadata and switching to searching Economic databases.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!jhnq!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2d31d3d5-68a1-445a-a277-cb513ad3e0b1_1009x690.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!jhnq!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2d31d3d5-68a1-445a-a277-cb513ad3e0b1_1009x690.png 424w, 
https://substackcdn.com/image/fetch/$s_!jhnq!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2d31d3d5-68a1-445a-a277-cb513ad3e0b1_1009x690.png 848w, https://substackcdn.com/image/fetch/$s_!jhnq!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2d31d3d5-68a1-445a-a277-cb513ad3e0b1_1009x690.png 1272w, https://substackcdn.com/image/fetch/$s_!jhnq!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2d31d3d5-68a1-445a-a277-cb513ad3e0b1_1009x690.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!jhnq!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2d31d3d5-68a1-445a-a277-cb513ad3e0b1_1009x690.png" width="1009" height="690" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/2d31d3d5-68a1-445a-a277-cb513ad3e0b1_1009x690.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:690,&quot;width&quot;:1009,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:148366,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/200973726?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2d31d3d5-68a1-445a-a277-cb513ad3e0b1_1009x690.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!jhnq!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2d31d3d5-68a1-445a-a277-cb513ad3e0b1_1009x690.png 424w, https://substackcdn.com/image/fetch/$s_!jhnq!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2d31d3d5-68a1-445a-a277-cb513ad3e0b1_1009x690.png 848w, https://substackcdn.com/image/fetch/$s_!jhnq!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2d31d3d5-68a1-445a-a277-cb513ad3e0b1_1009x690.png 1272w, https://substackcdn.com/image/fetch/$s_!jhnq!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2d31d3d5-68a1-445a-a277-cb513ad3e0b1_1009x690.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" 
stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>But what if the database description just doesn&#8217;t have the right terms? Here is where LLMs can also help by &#8220;cheating&#8221; because they already know the answer (from pretraining knowledge).</p><p>In this query, I asked for datasets with the right terms and it seems to do as expected, surfacing the obvious databases.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!wFFI!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8f90d6d7-d3ae-4be1-8451-bde3615c11af_849x790.webp" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!wFFI!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8f90d6d7-d3ae-4be1-8451-bde3615c11af_849x790.webp 424w, https://substackcdn.com/image/fetch/$s_!wFFI!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8f90d6d7-d3ae-4be1-8451-bde3615c11af_849x790.webp 848w, https://substackcdn.com/image/fetch/$s_!wFFI!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8f90d6d7-d3ae-4be1-8451-bde3615c11af_849x790.webp 1272w, https://substackcdn.com/image/fetch/$s_!wFFI!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8f90d6d7-d3ae-4be1-8451-bde3615c11af_849x790.webp 
1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!wFFI!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8f90d6d7-d3ae-4be1-8451-bde3615c11af_849x790.webp" width="849" height="790" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/8f90d6d7-d3ae-4be1-8451-bde3615c11af_849x790.webp&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:790,&quot;width&quot;:849,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!wFFI!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8f90d6d7-d3ae-4be1-8451-bde3615c11af_849x790.webp 424w, https://substackcdn.com/image/fetch/$s_!wFFI!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8f90d6d7-d3ae-4be1-8451-bde3615c11af_849x790.webp 848w, https://substackcdn.com/image/fetch/$s_!wFFI!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8f90d6d7-d3ae-4be1-8451-bde3615c11af_849x790.webp 1272w, https://substackcdn.com/image/fetch/$s_!wFFI!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8f90d6d7-d3ae-4be1-8451-bde3615c11af_849x790.webp 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft 
pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>But then I noticed the searches it did</p><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!ouTf!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2a90ed17-15ba-4dd0-b7e0-85cec1aabe7f_318x107.webp" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!ouTf!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2a90ed17-15ba-4dd0-b7e0-85cec1aabe7f_318x107.webp 424w, 
https://substackcdn.com/image/fetch/$s_!ouTf!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2a90ed17-15ba-4dd0-b7e0-85cec1aabe7f_318x107.webp 848w, https://substackcdn.com/image/fetch/$s_!ouTf!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2a90ed17-15ba-4dd0-b7e0-85cec1aabe7f_318x107.webp 1272w, https://substackcdn.com/image/fetch/$s_!ouTf!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2a90ed17-15ba-4dd0-b7e0-85cec1aabe7f_318x107.webp 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!ouTf!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2a90ed17-15ba-4dd0-b7e0-85cec1aabe7f_318x107.webp" width="318" height="107" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/2a90ed17-15ba-4dd0-b7e0-85cec1aabe7f_318x107.webp&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:107,&quot;width&quot;:318,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!ouTf!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2a90ed17-15ba-4dd0-b7e0-85cec1aabe7f_318x107.webp 424w, 
https://substackcdn.com/image/fetch/$s_!ouTf!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2a90ed17-15ba-4dd0-b7e0-85cec1aabe7f_318x107.webp 848w, https://substackcdn.com/image/fetch/$s_!ouTf!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2a90ed17-15ba-4dd0-b7e0-85cec1aabe7f_318x107.webp 1272w, https://substackcdn.com/image/fetch/$s_!ouTf!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2a90ed17-15ba-4dd0-b7e0-85cec1aabe7f_318x107.webp 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p>The <a href="https://search.library.smu.edu.sg/discovery/search?query=any%2Ccontains%2Cexecutive+compensation&amp;tab=Catalogue&amp;search_scope=MyInstitution&amp;vid=65SMU_INST%3ASMU_NUI&amp;lang=en&amp;offset=0&amp;sortby=rank&amp;facet=rtype%2Cinclude%2Cdatabases">first search was expected</a> but the <a href="https://search.library.smu.edu.sg/discovery/search?query=any%2Ccontains%2CExecuComp&amp;tab=Catalogue&amp;search_scope=MyInstitution&amp;vid=65SMU_INST%3ASMU_NUI&amp;lang=en&amp;offset=0&amp;sortby=rank&amp;facet=rtype%2Cinclude%2Cdatabases">second was odd - a known item search of the dataset ExecuComp!</a> In short, a large LLM is capable of knowing the right answer in advance and then searching just to confirm that we have access! 
</p><p>Below is yet another similar example, where it searched directly for Audit Analytics (a known item search of a dataset in WRDS) when asked about datasets on audit reports.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!jQe3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd8095bd-9d8d-4914-b731-2e66ae63477d_809x246.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!jQe3!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd8095bd-9d8d-4914-b731-2e66ae63477d_809x246.png 424w, https://substackcdn.com/image/fetch/$s_!jQe3!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd8095bd-9d8d-4914-b731-2e66ae63477d_809x246.png 848w, https://substackcdn.com/image/fetch/$s_!jQe3!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd8095bd-9d8d-4914-b731-2e66ae63477d_809x246.png 1272w, https://substackcdn.com/image/fetch/$s_!jQe3!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd8095bd-9d8d-4914-b731-2e66ae63477d_809x246.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!jQe3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd8095bd-9d8d-4914-b731-2e66ae63477d_809x246.png" width="809" height="246" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/dd8095bd-9d8d-4914-b731-2e66ae63477d_809x246.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:246,&quot;width&quot;:809,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:15705,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/200973726?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd8095bd-9d8d-4914-b731-2e66ae63477d_809x246.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!jQe3!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd8095bd-9d8d-4914-b731-2e66ae63477d_809x246.png 424w, https://substackcdn.com/image/fetch/$s_!jQe3!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd8095bd-9d8d-4914-b731-2e66ae63477d_809x246.png 848w, https://substackcdn.com/image/fetch/$s_!jQe3!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd8095bd-9d8d-4914-b731-2e66ae63477d_809x246.png 1272w, https://substackcdn.com/image/fetch/$s_!jQe3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd8095bd-9d8d-4914-b731-2e66ae63477d_809x246.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>What comes next is going to double down on understanding agents. <a href="https://ink.library.smu.edu.sg/force2026/Programme/agenda/20/">At FORCE2026 I presented a small study of the reproducibility of the agentic search tools Undermind and Consensus</a> with the title -<em> Does Agentic Deep Search Converge? Reproducibility Questions for LLM-Driven Literature Discovery</em>, and the results were &#8220;interestingly wrong&#8221; in ways worth writing up here. 
</p><p></p><h3>An agentic skill for building and testing high-sensitivity Boolean search strategies for PubMed.</h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!CCcu!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa3020cba-00b5-49ee-b114-c411262bb022_1122x1402.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!CCcu!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa3020cba-00b5-49ee-b114-c411262bb022_1122x1402.png 424w, https://substackcdn.com/image/fetch/$s_!CCcu!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa3020cba-00b5-49ee-b114-c411262bb022_1122x1402.png 848w, https://substackcdn.com/image/fetch/$s_!CCcu!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa3020cba-00b5-49ee-b114-c411262bb022_1122x1402.png 1272w, https://substackcdn.com/image/fetch/$s_!CCcu!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa3020cba-00b5-49ee-b114-c411262bb022_1122x1402.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!CCcu!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa3020cba-00b5-49ee-b114-c411262bb022_1122x1402.png" width="1122" height="1402" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/a3020cba-00b5-49ee-b114-c411262bb022_1122x1402.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1402,&quot;width&quot;:1122,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1632772,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/200973726?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa3020cba-00b5-49ee-b114-c411262bb022_1122x1402.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!CCcu!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa3020cba-00b5-49ee-b114-c411262bb022_1122x1402.png 424w, https://substackcdn.com/image/fetch/$s_!CCcu!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa3020cba-00b5-49ee-b114-c411262bb022_1122x1402.png 848w, https://substackcdn.com/image/fetch/$s_!CCcu!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa3020cba-00b5-49ee-b114-c411262bb022_1122x1402.png 1272w, https://substackcdn.com/image/fetch/$s_!CCcu!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa3020cba-00b5-49ee-b114-c411262bb022_1122x1402.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The bigger piece is one I have put off for too long, out of impostor syndrome and a sense of how evidence synthesis librarians might react (exacting high standards for obvious reasons): a write-up of a Claude and Codex skill I built for high-sensitivity Boolean searching in PubMed. </p><ul><li><p>It is designed to heavily do tool use, using PubMed searching and MeSH browsing to check for promising terms, test pilot search strategies etc. 
</p></li><li><p>Instructions also include very specific domain knowledge on how to go about conducting the process based on my (somewhat limited) knowledge of best practices.</p></li><li><p>Comprehensive audit logging, so you can see at every step what was done and what decision was made.</p></li><li><p>Hooks that use code to enforce important steps and checks.</p></li><li><p>Maybe 50+ hours of testing against gold standard sets to test for edge cases.</p></li></ul><p>It is the most concrete demonstration I have of the argument I opened with. Once you wrap the model in a harness that can run deterministic checks in code and make it verify its claims against independent sources rather than generate them, much of what people fear about fabrication stops being inevitable. </p><p>The PubMed skill is one small instance of that pattern, and I think it generalises. Descriptive and subject cataloguing is another domain where a similar method could be applied.</p><p>While I don&#8217;t think my home-brew skill currently exceeds the best experts, it has reached the point where it can reproduce or improve on many of the moves I would make myself, while logging and checking them more consistently (which is why I can&#8217;t easily improve it further). I suspect a team consisting of evidence synthesis experts and professional coders will be able to push it much further than I did.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee via ko-fi!&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee via ko-fi!</span></a></p><h2>Conclusion</h2><p>Agentic skills scare me because they look like a second attempt at expert systems, but with a crucial difference. The old systems tried to hard-code expertise. 
The new ones combine flexible language-model reasoning with tools, logs, tests, and code-enforced constraints. Maybe even that isn&#8217;t enough, but this &#8220;neurosymbolic AI&#8221; approach  does make them much more plausible as systems for operationalising professional judgement with all the obvious implications<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-2" href="#footnote-2" target="_self">2</a>.</p><p>Yes, I could be totally wrong. Even then, I would rather name what could be better and be wrong in public than pretend something is settled. If a take here does not hold up in a year, I would sooner hear about it than quietly forget I wrote it.</p><p>That goes especially for the readers who arrived through my more critical posts, and who I suspect sit closer to the resist-AI end of things. I hope some of you stayed once it was clear that I am, on the whole, positive about AI for search, and I would rather argue it out with you than preach to people who already agree.</p><p>Thank you, then, for a year of reading and pushing back. The work is better for it. Here is to the next set of posts, and to being usefully wrong together.</p><div class="captioned-button-wrap" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/what-a-year-of-testing-and-thinking?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="CaptionedButtonToDOM"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! 
This post is public so feel free to share it.</p></div><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/what-a-year-of-testing-and-thinking?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://aarontay.substack.com/p/what-a-year-of-testing-and-thinking?utm_source=substack&utm_medium=email&utm_content=share&action=share"><span>Share</span></a></p></div><p></p><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-1" href="#footnote-anchor-1" class="footnote-number" contenteditable="false" target="_self">1</a><div class="footnote-content"><p>It also got me a ton of subscribers, many of whom I suspect are in the &#8220;resist AI&#8221; camp. I do hope at least some of them stuck around, after they realised I am on the whole very positive about the use of AI for search.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-2" href="#footnote-anchor-2" class="footnote-number" contenteditable="false" target="_self">2</a><div class="footnote-content"><p>Watching Codex or Claude run code and get an error, then smoothly work around it for the first time was an eye-opener. 
You could even then ask it to fix the skill so future runs would not get this issue!</p></div></div>]]></content:encoded></item><item><title><![CDATA[Hot take: Stop calling poor search rankings necessary friction for learning]]></title><description><![CDATA[Boundary learning, adjacent literature, and why intentional design beats accidental noise.]]></description><link>https://aarontay.substack.com/p/hot-take-stop-calling-poor-search</link><guid isPermaLink="false">https://aarontay.substack.com/p/hot-take-stop-calling-poor-search</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Mon, 01 Jun 2026 19:25:54 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!gPoc!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9ab11e3f-336d-4d41-9e33-9b80b906334d_1672x941.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!gPoc!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9ab11e3f-336d-4d41-9e33-9b80b906334d_1672x941.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!gPoc!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9ab11e3f-336d-4d41-9e33-9b80b906334d_1672x941.png 424w, https://substackcdn.com/image/fetch/$s_!gPoc!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9ab11e3f-336d-4d41-9e33-9b80b906334d_1672x941.png 848w, 
https://substackcdn.com/image/fetch/$s_!gPoc!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9ab11e3f-336d-4d41-9e33-9b80b906334d_1672x941.png 1272w, https://substackcdn.com/image/fetch/$s_!gPoc!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9ab11e3f-336d-4d41-9e33-9b80b906334d_1672x941.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!gPoc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9ab11e3f-336d-4d41-9e33-9b80b906334d_1672x941.png" width="1456" height="819" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/9ab11e3f-336d-4d41-9e33-9b80b906334d_1672x941.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:819,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:2019348,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/199420296?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9ab11e3f-336d-4d41-9e33-9b80b906334d_1672x941.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!gPoc!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9ab11e3f-336d-4d41-9e33-9b80b906334d_1672x941.png 424w, 
https://substackcdn.com/image/fetch/$s_!gPoc!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9ab11e3f-336d-4d41-9e33-9b80b906334d_1672x941.png 848w, https://substackcdn.com/image/fetch/$s_!gPoc!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9ab11e3f-336d-4d41-9e33-9b80b906334d_1672x941.png 1272w, https://substackcdn.com/image/fetch/$s_!gPoc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9ab11e3f-336d-4d41-9e33-9b80b906334d_1672x941.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" 
y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><em>This post is part of a &#8220;hot takes&#8221; series in which I make sharper claims than I usually do. I do not intend to offend, and I am not trying to tar every librarian with the same brush &#8212; the patterns I describe and perceive may be a function of my own local context. <a href="https://aarontay.substack.com/p/ai-academic-search-and-the-missing">In my last hot takes post</a>, I argued that quality AI search that gives better rankings might not be fit for purpose for a librarian teaching undergraduate information literacy because &#8220;friction is pedagogically useful and one could even argue better search results removes friction!&#8221;. Here I examine this argument more carefully.</em></p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! 
Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!GmiH!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a8b6640-8803-44be-8a2e-122a6ef3359b_1251x693.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!GmiH!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a8b6640-8803-44be-8a2e-122a6ef3359b_1251x693.png 424w, https://substackcdn.com/image/fetch/$s_!GmiH!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a8b6640-8803-44be-8a2e-122a6ef3359b_1251x693.png 848w, https://substackcdn.com/image/fetch/$s_!GmiH!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a8b6640-8803-44be-8a2e-122a6ef3359b_1251x693.png 1272w, https://substackcdn.com/image/fetch/$s_!GmiH!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a8b6640-8803-44be-8a2e-122a6ef3359b_1251x693.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!GmiH!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a8b6640-8803-44be-8a2e-122a6ef3359b_1251x693.png" width="1251" 
height="693" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/1a8b6640-8803-44be-8a2e-122a6ef3359b_1251x693.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:693,&quot;width&quot;:1251,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!GmiH!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a8b6640-8803-44be-8a2e-122a6ef3359b_1251x693.png 424w, https://substackcdn.com/image/fetch/$s_!GmiH!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a8b6640-8803-44be-8a2e-122a6ef3359b_1251x693.png 848w, https://substackcdn.com/image/fetch/$s_!GmiH!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a8b6640-8803-44be-8a2e-122a6ef3359b_1251x693.png 1272w, https://substackcdn.com/image/fetch/$s_!GmiH!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a8b6640-8803-44be-8a2e-122a6ef3359b_1251x693.png 1456w" sizes="100vw"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee via ko-fi!&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee via ko-fi!</span></a></p><p></p><p>Months ago I read a review of an AI search tool that spent most of its length complaining about how poorly the tool ranked results, then made a striking turn at the end: poor relevancy ranking was supposedly a virtue, because learning needs friction.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!P3u4!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8dcb36ae-ead6-4fad-8ac2-510477990664_1251x709.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" 
srcset="https://substackcdn.com/image/fetch/$s_!P3u4!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8dcb36ae-ead6-4fad-8ac2-510477990664_1251x709.png 424w, https://substackcdn.com/image/fetch/$s_!P3u4!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8dcb36ae-ead6-4fad-8ac2-510477990664_1251x709.png 848w, https://substackcdn.com/image/fetch/$s_!P3u4!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8dcb36ae-ead6-4fad-8ac2-510477990664_1251x709.png 1272w, https://substackcdn.com/image/fetch/$s_!P3u4!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8dcb36ae-ead6-4fad-8ac2-510477990664_1251x709.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!P3u4!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8dcb36ae-ead6-4fad-8ac2-510477990664_1251x709.png" width="1251" height="709" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/8dcb36ae-ead6-4fad-8ac2-510477990664_1251x709.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:709,&quot;width&quot;:1251,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:945347,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/199420296?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8dcb36ae-ead6-4fad-8ac2-510477990664_1251x709.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" 
class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!P3u4!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8dcb36ae-ead6-4fad-8ac2-510477990664_1251x709.png 424w, https://substackcdn.com/image/fetch/$s_!P3u4!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8dcb36ae-ead6-4fad-8ac2-510477990664_1251x709.png 848w, https://substackcdn.com/image/fetch/$s_!P3u4!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8dcb36ae-ead6-4fad-8ac2-510477990664_1251x709.png 1272w, https://substackcdn.com/image/fetch/$s_!P3u4!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8dcb36ae-ead6-4fad-8ac2-510477990664_1251x709.png 1456w" sizes="100vw"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" 
stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>My first reaction was that this confused good friction (the cognitive effort required to master a topic&#8217;s boundaries) with bad friction (the time wasted fighting unintuitive operators, lexical noise and uninformative junk)<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-1" href="#footnote-1" target="_self">1</a>. But that is too easy a dismissal. Versions of the argument keep resurfacing, and underneath the crude version is a harder question that does not collapse so quickly.</p><p>Before diving in, some quick framing notes. </p><p>First, I am talking about ordinary narrative reviews and information-literacy contexts; systematic reviews have different requirements and are set aside here. </p><p>Second, if you think no AI search system currently gives materially better results than a traditional BM25 discovery layer, bracket that for now. <a href="https://aarontay.substack.com/p/ai-academic-search-and-the-missing#:~:text=But%20if%20you%20need%20one%20tool%20to%20point%20at%20that%20I%20consider%20a%20%E2%80%9Cbetter%20AI%20seach%20tool%E2%80%9D%20%2D%20I%20would%20consider%20Undermind.ai%20as%20an%20example2.">Assume a genuinely better-ranking system and ask what follows</a>.</p><p>Lastly, I am holding the interface constant. Much of the current anxiety about AI search is really anxiety about RAG-style answer engines and/or <a href="https://aarontay.substack.com/p/why-i-think-academic-deep-research">deep research tools</a>: systems where the user types a question, gets back a synthesised response, and may never seriously engage with the underlying documents. 
</p><p><a href="https://www.oneusefulthing.org/p/choosing-to-stay-human">Ethan Mollick has recently documented real instances of this kind of cognitive surrender</a>. That is a legitimate concern that deserves discussion, but in this essay I focus just on better retrieval and ranking. If better ranking alone is supposed to damage learning, we should be able to say exactly how.</p><h2><strong>The weak arguments</strong></h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!zuN6!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F82ade794-3f77-4d14-8d87-491d606888b9_1254x703.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!zuN6!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F82ade794-3f77-4d14-8d87-491d606888b9_1254x703.png 424w, https://substackcdn.com/image/fetch/$s_!zuN6!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F82ade794-3f77-4d14-8d87-491d606888b9_1254x703.png 848w, https://substackcdn.com/image/fetch/$s_!zuN6!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F82ade794-3f77-4d14-8d87-491d606888b9_1254x703.png 1272w, https://substackcdn.com/image/fetch/$s_!zuN6!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F82ade794-3f77-4d14-8d87-491d606888b9_1254x703.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!zuN6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F82ade794-3f77-4d14-8d87-491d606888b9_1254x703.png" width="1254" height="703" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/82ade794-3f77-4d14-8d87-491d606888b9_1254x703.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:703,&quot;width&quot;:1254,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:789394,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/199420296?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F82ade794-3f77-4d14-8d87-491d606888b9_1254x703.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!zuN6!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F82ade794-3f77-4d14-8d87-491d606888b9_1254x703.png 424w, https://substackcdn.com/image/fetch/$s_!zuN6!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F82ade794-3f77-4d14-8d87-491d606888b9_1254x703.png 848w, https://substackcdn.com/image/fetch/$s_!zuN6!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F82ade794-3f77-4d14-8d87-491d606888b9_1254x703.png 1272w, https://substackcdn.com/image/fetch/$s_!zuN6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F82ade794-3f77-4d14-8d87-491d606888b9_1254x703.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Before getting to the harder question, three things need to be cleared away.</p><p>The first is a reflex that often appears when new tools arrive - making it easier to do things that once were hard and required expertise. Many experts may be tempted by the idea that struggle is inherently virtuous, and that making something easier is a bad idea.  
Perhaps some experts might even have an unconscious vested interest in defending their hard-won expertise, grasping at the friction argument as a justification<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-2" href="#footnote-2" target="_self">2</a>. </p><p>The second is a concern often raised alongside the friction argument: that LLM- and <a href="https://aarontay.substack.com/p/why-embedding-vector-search-is-probably">embedding-based systems</a> encode biases that could be amplified at scale if every novice uses the same AI-ranked tool to map a field. This is real, but it is a different question. Leaving aside that there is a huge variety of AI search engines using very different techniques, traditional lexical systems are not neutral either, and people have worried about the dominance of Google Scholar amplifying bias. The homogenisation worry is better understood as an argument for epistemic diversity, interface pluralism, and transparency about retrieval choices, rather than for inferior ranking<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-3" href="#footnote-3" target="_self">3</a>.  </p><p>The third is the crude claim that poor ranking is itself mostly or even always educationally valuable. It is not, and one test disposes of it. If poor ranking were valuable as such, we ought in principle to be willing to worsen it deliberately: degrade the scoring function, shuffle the top results, inject noise. At the extreme, results should be totally random! Nobody wants that. </p><p>But no reasonable person believes that. What about a much weaker claim: that the friction from poor relevancy ranking is &#8220;sometimes valuable&#8221;? This is what the rest of the post takes up. My belief is that the educational value of poor relevancy, if any, does not lie in worse ranking itself. 
Rather, it is an effect that weak ranking sometimes produces by accident<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-4" href="#footnote-4" target="_self">4</a>.</p><p> </p><h2>The question worth asking</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!DdbI!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F606d8005-7795-45b4-bc83-46451ad080b4_1256x703.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!DdbI!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F606d8005-7795-45b4-bc83-46451ad080b4_1256x703.png 424w, https://substackcdn.com/image/fetch/$s_!DdbI!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F606d8005-7795-45b4-bc83-46451ad080b4_1256x703.png 848w, https://substackcdn.com/image/fetch/$s_!DdbI!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F606d8005-7795-45b4-bc83-46451ad080b4_1256x703.png 1272w, https://substackcdn.com/image/fetch/$s_!DdbI!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F606d8005-7795-45b4-bc83-46451ad080b4_1256x703.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!DdbI!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F606d8005-7795-45b4-bc83-46451ad080b4_1256x703.png" width="1256" height="703" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/606d8005-7795-45b4-bc83-46451ad080b4_1256x703.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:703,&quot;width&quot;:1256,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:265691,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/199420296?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F606d8005-7795-45b4-bc83-46451ad080b4_1256x703.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!DdbI!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F606d8005-7795-45b4-bc83-46451ad080b4_1256x703.png 424w, https://substackcdn.com/image/fetch/$s_!DdbI!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F606d8005-7795-45b4-bc83-46451ad080b4_1256x703.png 848w, https://substackcdn.com/image/fetch/$s_!DdbI!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F606d8005-7795-45b4-bc83-46451ad080b4_1256x703.png 1272w, https://substackcdn.com/image/fetch/$s_!DdbI!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F606d8005-7795-45b4-bc83-46451ad080b4_1256x703.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>What survives, once those are set aside, is a harder question. Suppose we had a search system that ranked documents perfectly by topical relevance, by every standard IR measure: precision, recall, nDCG. Would it also be the best system for someone learning a topic<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-5" href="#footnote-5" target="_self">5</a>? If not, then in what way, and why?</p><p>I have always thought the answer was clearly yes, but the more I thought about it, the more I felt this question is an interesting one; the rest of this post is an attempt to answer it. 
I have discussed this with librarians who hold the view that a very good, or even perfect, retrieval and ranking system would be pedagogically detrimental, and this is my best attempt to steelman their argument.</p><p>The short version: great topical ranking and pedagogical value can and sometimes do diverge in particular ways, but the reasons matter. They do not automatically justify poor ranking or vindicate the friction case in a straightforward way. Instead, they argue for designing systems and pedagogy around the things straight-forward good ranking alone cannot deliver<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-6" href="#footnote-6" target="_self">6</a>.</p><h2>The different types of irrelevance</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!chHi!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0a40640-0a96-4ccb-bf31-91883bdd2ba0_1249x707.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!chHi!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0a40640-0a96-4ccb-bf31-91883bdd2ba0_1249x707.png 424w, https://substackcdn.com/image/fetch/$s_!chHi!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0a40640-0a96-4ccb-bf31-91883bdd2ba0_1249x707.png 848w, https://substackcdn.com/image/fetch/$s_!chHi!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0a40640-0a96-4ccb-bf31-91883bdd2ba0_1249x707.png 1272w, 
https://substackcdn.com/image/fetch/$s_!chHi!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0a40640-0a96-4ccb-bf31-91883bdd2ba0_1249x707.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!chHi!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0a40640-0a96-4ccb-bf31-91883bdd2ba0_1249x707.png" width="1249" height="707" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f0a40640-0a96-4ccb-bf31-91883bdd2ba0_1249x707.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:707,&quot;width&quot;:1249,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:681321,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/199420296?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0a40640-0a96-4ccb-bf31-91883bdd2ba0_1249x707.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!chHi!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0a40640-0a96-4ccb-bf31-91883bdd2ba0_1249x707.png 424w, https://substackcdn.com/image/fetch/$s_!chHi!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0a40640-0a96-4ccb-bf31-91883bdd2ba0_1249x707.png 848w, 
https://substackcdn.com/image/fetch/$s_!chHi!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0a40640-0a96-4ccb-bf31-91883bdd2ba0_1249x707.png 1272w, https://substackcdn.com/image/fetch/$s_!chHi!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0a40640-0a96-4ccb-bf31-91883bdd2ba0_1249x707.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Let me suggest that not all irrelevant results are equal.</p><p>Some irrelevance in a result list is informative. 
An &#8220;irrelevant&#8221; result that appears because it belongs to an adjacent subfield, uses overlapping vocabulary, or reflects a nearby conceptual frame may genuinely help a learner understand where a topic begins and ends.</p><p>Other irrelevance is uninformative. A hit that appears because of a homonym, a stopword quirk, or a lexical accident teaches the novice nothing about the structure of the field. It teaches, at most, that search language can be messy<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-7" href="#footnote-7" target="_self">7</a>.</p><p>Poor ranking does not discriminate between these. It produces a messy mixture of both, especially for novices, who are least equipped to tell the difference. So the answer to the harder question takes a particular shape: when topical ranking and pedagogical value come apart, it is because better ranking can remove informative irrelevance along with the uninformative kind. If that is right, the response is not worse ranking. 
It is intentional design.</p><p>Two careful versions of the objection are worth examining through this lens.</p><h3><strong>Version one: seeing search terms in context</strong></h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!60Rj!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc28921bb-b298-401c-a4c3-41f82d02c08c_1249x701.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!60Rj!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc28921bb-b298-401c-a4c3-41f82d02c08c_1249x701.png 424w, https://substackcdn.com/image/fetch/$s_!60Rj!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc28921bb-b298-401c-a4c3-41f82d02c08c_1249x701.png 848w, https://substackcdn.com/image/fetch/$s_!60Rj!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc28921bb-b298-401c-a4c3-41f82d02c08c_1249x701.png 1272w, https://substackcdn.com/image/fetch/$s_!60Rj!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc28921bb-b298-401c-a4c3-41f82d02c08c_1249x701.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!60Rj!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc28921bb-b298-401c-a4c3-41f82d02c08c_1249x701.png" width="1249" height="701" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c28921bb-b298-401c-a4c3-41f82d02c08c_1249x701.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:701,&quot;width&quot;:1249,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:777770,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/199420296?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc28921bb-b298-401c-a4c3-41f82d02c08c_1249x701.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!60Rj!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc28921bb-b298-401c-a4c3-41f82d02c08c_1249x701.png 424w, https://substackcdn.com/image/fetch/$s_!60Rj!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc28921bb-b298-401c-a4c3-41f82d02c08c_1249x701.png 848w, https://substackcdn.com/image/fetch/$s_!60Rj!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc28921bb-b298-401c-a4c3-41f82d02c08c_1249x701.png 1272w, https://substackcdn.com/image/fetch/$s_!60Rj!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc28921bb-b298-401c-a4c3-41f82d02c08c_1249x701.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The first argument is that students benefit from seeing the terms from their assignment prompt used in actual scholarly contexts, and from gradually learning the vocabulary of a field through retrieval itself.</p><p>That is plausible, and it is also not undermined by better ranking. If anything, accurate ranking increases the chance that students encounter their search terms in genuinely relevant documents rather than tangential ones. The vocabulary they see on a precise hit is more likely to belong to the field than the vocabulary they would have encountered on a near-miss caused by a lexical accident.</p><p>This version survives only if novices learn vocabulary better from a noisier signal than a cleaner one. 
Pedagogically, I don&#8217;t see why this is the case.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!e4_o!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F47c87f6b-71cf-4a81-be95-080e3a1bb6c3_1218x677.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!e4_o!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F47c87f6b-71cf-4a81-be95-080e3a1bb6c3_1218x677.png 424w, https://substackcdn.com/image/fetch/$s_!e4_o!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F47c87f6b-71cf-4a81-be95-080e3a1bb6c3_1218x677.png 848w, https://substackcdn.com/image/fetch/$s_!e4_o!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F47c87f6b-71cf-4a81-be95-080e3a1bb6c3_1218x677.png 1272w, https://substackcdn.com/image/fetch/$s_!e4_o!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F47c87f6b-71cf-4a81-be95-080e3a1bb6c3_1218x677.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!e4_o!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F47c87f6b-71cf-4a81-be95-080e3a1bb6c3_1218x677.png" width="1218" height="677" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/47c87f6b-71cf-4a81-be95-080e3a1bb6c3_1218x677.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:677,&quot;width&quot;:1218,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:593166,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/199420296?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F47c87f6b-71cf-4a81-be95-080e3a1bb6c3_1218x677.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!e4_o!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F47c87f6b-71cf-4a81-be95-080e3a1bb6c3_1218x677.png 424w, https://substackcdn.com/image/fetch/$s_!e4_o!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F47c87f6b-71cf-4a81-be95-080e3a1bb6c3_1218x677.png 848w, https://substackcdn.com/image/fetch/$s_!e4_o!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F47c87f6b-71cf-4a81-be95-080e3a1bb6c3_1218x677.png 1272w, https://substackcdn.com/image/fetch/$s_!e4_o!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F47c87f6b-71cf-4a81-be95-080e3a1bb6c3_1218x677.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" 
width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>You might object: if <a href="https://aarontay.substack.com/p/why-embedding-vector-search-is-probably">modern search engines use semantic matching with dense embeddings</a>, how would they perform and display the keyword-style match highlighting seen on the results pages of conventional keyword engines (e.g. Google Scholar)? 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!DiAj!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed1c060a-dd06-44b0-ac24-6940ee793b91_1287x623.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!DiAj!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed1c060a-dd06-44b0-ac24-6940ee793b91_1287x623.png 424w, https://substackcdn.com/image/fetch/$s_!DiAj!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed1c060a-dd06-44b0-ac24-6940ee793b91_1287x623.png 848w, https://substackcdn.com/image/fetch/$s_!DiAj!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed1c060a-dd06-44b0-ac24-6940ee793b91_1287x623.png 1272w, https://substackcdn.com/image/fetch/$s_!DiAj!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed1c060a-dd06-44b0-ac24-6940ee793b91_1287x623.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!DiAj!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed1c060a-dd06-44b0-ac24-6940ee793b91_1287x623.png" width="1287" height="623" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ed1c060a-dd06-44b0-ac24-6940ee793b91_1287x623.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:623,&quot;width&quot;:1287,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:103305,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/199420296?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed1c060a-dd06-44b0-ac24-6940ee793b91_1287x623.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!DiAj!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed1c060a-dd06-44b0-ac24-6940ee793b91_1287x623.png 424w, https://substackcdn.com/image/fetch/$s_!DiAj!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed1c060a-dd06-44b0-ac24-6940ee793b91_1287x623.png 848w, https://substackcdn.com/image/fetch/$s_!DiAj!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed1c060a-dd06-44b0-ac24-6940ee793b91_1287x623.png 1272w, https://substackcdn.com/image/fetch/$s_!DiAj!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed1c060a-dd06-44b0-ac24-6940ee793b91_1287x623.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Interestingly, <a href="https://aarontay.substack.com/p/can-semantic-search-be-more">some newer retrieval models can do something akin to, if not better than, old-style keyword highlighting. Late-interaction and multi-vector systems such as ColBERT, or learnt sparse embedding methods like SPLADE, can expose which terms or passages contributed most to the relevance score, including semantic neighbours in addition to exact lexical matches.</a> In principle, that could support vocabulary growth better than traditional keyword-only ranking, because it can surface terminology matches the student would not have thought to search for. 
</p><p>The example below shows how a ColBERT-type search system highlights the terms in the document (both exact lexical matches and semantic matches) that contribute the most to the relevance score.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!WERX!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29a47f26-a97c-4e42-bea2-32f2b6b6eab7_634x639.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!WERX!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29a47f26-a97c-4e42-bea2-32f2b6b6eab7_634x639.png 424w, https://substackcdn.com/image/fetch/$s_!WERX!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29a47f26-a97c-4e42-bea2-32f2b6b6eab7_634x639.png 848w, https://substackcdn.com/image/fetch/$s_!WERX!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29a47f26-a97c-4e42-bea2-32f2b6b6eab7_634x639.png 1272w, https://substackcdn.com/image/fetch/$s_!WERX!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29a47f26-a97c-4e42-bea2-32f2b6b6eab7_634x639.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!WERX!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29a47f26-a97c-4e42-bea2-32f2b6b6eab7_634x639.png" width="634" height="639" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/29a47f26-a97c-4e42-bea2-32f2b6b6eab7_634x639.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:639,&quot;width&quot;:634,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!WERX!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29a47f26-a97c-4e42-bea2-32f2b6b6eab7_634x639.png 424w, https://substackcdn.com/image/fetch/$s_!WERX!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29a47f26-a97c-4e42-bea2-32f2b6b6eab7_634x639.png 848w, https://substackcdn.com/image/fetch/$s_!WERX!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29a47f26-a97c-4e42-bea2-32f2b6b6eab7_634x639.png 1272w, https://substackcdn.com/image/fetch/$s_!WERX!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29a47f26-a97c-4e42-bea2-32f2b6b6eab7_634x639.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><h3><strong>Version two: boundary learning for novices</strong></h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!vxcS!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32fb29cc-a451-498f-91ce-5dc7acb6d16c_1225x672.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!vxcS!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32fb29cc-a451-498f-91ce-5dc7acb6d16c_1225x672.png 424w, https://substackcdn.com/image/fetch/$s_!vxcS!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32fb29cc-a451-498f-91ce-5dc7acb6d16c_1225x672.png 848w, 
https://substackcdn.com/image/fetch/$s_!vxcS!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32fb29cc-a451-498f-91ce-5dc7acb6d16c_1225x672.png 1272w, https://substackcdn.com/image/fetch/$s_!vxcS!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32fb29cc-a451-498f-91ce-5dc7acb6d16c_1225x672.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!vxcS!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32fb29cc-a451-498f-91ce-5dc7acb6d16c_1225x672.png" width="1225" height="672" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/32fb29cc-a451-498f-91ce-5dc7acb6d16c_1225x672.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:672,&quot;width&quot;:1225,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:951292,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/199420296?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32fb29cc-a451-498f-91ce-5dc7acb6d16c_1225x672.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!vxcS!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32fb29cc-a451-498f-91ce-5dc7acb6d16c_1225x672.png 424w, 
https://substackcdn.com/image/fetch/$s_!vxcS!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32fb29cc-a451-498f-91ce-5dc7acb6d16c_1225x672.png 848w, https://substackcdn.com/image/fetch/$s_!vxcS!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32fb29cc-a451-498f-91ce-5dc7acb6d16c_1225x672.png 1272w, https://substackcdn.com/image/fetch/$s_!vxcS!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32fb29cc-a451-498f-91ce-5dc7acb6d16c_1225x672.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The stronger version is about something more specific than vocabulary or effort. It is about the novice&#8217;s need to learn a topic&#8217;s boundaries through exposure to meaningful near-misses and adjacent literatures.</p><p>A novice on a new topic cannot simply search broader, because they do not yet know what broader would mean. They do not know which adjacent areas matter, which terms are near-synonyms, which distinctions are important. For that learner, boundary formation has to happen partly through retrieval itself. Some of what matters may be found not in the core results but in the edge cases.</p><p>This is a fair point, and it is where the informative/uninformative distinction earns its keep.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!_Wuq!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F953a8d07-b53f-4230-8c5e-19f686281c15_1233x700.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!_Wuq!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F953a8d07-b53f-4230-8c5e-19f686281c15_1233x700.png 424w, https://substackcdn.com/image/fetch/$s_!_Wuq!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F953a8d07-b53f-4230-8c5e-19f686281c15_1233x700.png 848w, https://substackcdn.com/image/fetch/$s_!_Wuq!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F953a8d07-b53f-4230-8c5e-19f686281c15_1233x700.png 1272w, 
https://substackcdn.com/image/fetch/$s_!_Wuq!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F953a8d07-b53f-4230-8c5e-19f686281c15_1233x700.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!_Wuq!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F953a8d07-b53f-4230-8c5e-19f686281c15_1233x700.png" width="1233" height="700" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/953a8d07-b53f-4230-8c5e-19f686281c15_1233x700.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:700,&quot;width&quot;:1233,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:900089,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/199420296?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F953a8d07-b53f-4230-8c5e-19f686281c15_1233x700.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!_Wuq!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F953a8d07-b53f-4230-8c5e-19f686281c15_1233x700.png 424w, https://substackcdn.com/image/fetch/$s_!_Wuq!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F953a8d07-b53f-4230-8c5e-19f686281c15_1233x700.png 848w, 
https://substackcdn.com/image/fetch/$s_!_Wuq!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F953a8d07-b53f-4230-8c5e-19f686281c15_1233x700.png 1272w, https://substackcdn.com/image/fetch/$s_!_Wuq!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F953a8d07-b53f-4230-8c5e-19f686281c15_1233x700.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>If the case for &#8220;useful friction&#8221; rests on accidental exposure to meaningful adjacency, then the relevant question is 
whether poor ranking is a good mechanism for producing it. It is not. Poor ranking by definition generates adjacency mixed indiscriminately with junk. <em>There is no reason to prefer accidental adjacency mixed with lexical noise over a system that retrieves the core accurately and exposes adjacent material deliberately.</em></p><p>A retrieval system that can reliably retrieve works that are not just in your topic but adjacent topics opens a wealth of possibilities to help the user learn! </p><p>An example of what can be done is Undermind&#8217;s adjacent papers feature: a dedicated function that displays <em>papers citing the seminal works of the topic you are researching, despite being judged as falling outside the core topic itself</em><a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-8" href="#footnote-8" target="_self">8</a><em>. </em></p><blockquote><p>Consider the idea of serendipity. When libraries moved physical stacks to remote storage, users complained about losing <em>serendipitous browsing</em>, and they were right that something real was being lost. But the adjacency they valued was <em>not accidental</em>. It came from classification: LC and Dewey were designed to place related works near each other. The well-handled response was not to defend physical stacks at any cost but to build virtual shelf browsing, browse-by-call-number, and related-item interfaces that replicated the function digitally. The function was real and worth preserving; the mechanism changed. The same logic applies here. Adjacency exposure for boundary learning is real and worth preserving. The mechanism should be intentional design (adjacent papers, topic maps, related-citation views), not the accidental side-effects of worse ranking.</p></blockquote><p>This kind of result helps a novice see the edges of a topic and how neighbouring literatures branch from a common core. 
Topic maps, related-citation views, contrastive recommendations, and &#8220;nearby but different&#8221; clusters can do similar work.  <em>Don&#8217;t look now, but all this needs better retrieval and ranking not worse!</em></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!AgjO!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cc1b30e-53eb-4deb-8b33-4282facbbf77_1576x590.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!AgjO!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cc1b30e-53eb-4deb-8b33-4282facbbf77_1576x590.png 424w, https://substackcdn.com/image/fetch/$s_!AgjO!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cc1b30e-53eb-4deb-8b33-4282facbbf77_1576x590.png 848w, https://substackcdn.com/image/fetch/$s_!AgjO!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cc1b30e-53eb-4deb-8b33-4282facbbf77_1576x590.png 1272w, https://substackcdn.com/image/fetch/$s_!AgjO!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cc1b30e-53eb-4deb-8b33-4282facbbf77_1576x590.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!AgjO!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cc1b30e-53eb-4deb-8b33-4282facbbf77_1576x590.png" width="1456" height="545" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/2cc1b30e-53eb-4deb-8b33-4282facbbf77_1576x590.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:545,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:63297,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/199420296?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cc1b30e-53eb-4deb-8b33-4282facbbf77_1576x590.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!AgjO!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cc1b30e-53eb-4deb-8b33-4282facbbf77_1576x590.png 424w, https://substackcdn.com/image/fetch/$s_!AgjO!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cc1b30e-53eb-4deb-8b33-4282facbbf77_1576x590.png 848w, https://substackcdn.com/image/fetch/$s_!AgjO!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cc1b30e-53eb-4deb-8b33-4282facbbf77_1576x590.png 1272w, https://substackcdn.com/image/fetch/$s_!AgjO!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cc1b30e-53eb-4deb-8b33-4282facbbf77_1576x590.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The table above shows <a href="https://app.undermind.ai/report/836da672ee3b9726c2cefd1f3465a28bd6cf5eb2447a5a9bd5d8c3a538329c3d">&#8220;adjacent works&#8221; identified by Undermind that cite the foundational papers of your topic (In this case - does making papers open access lead to higher citations), but Undermind has judged to be not on your topic</a>. You can see that while it isn&#8217;t perfect, it does show you &#8220;Adjacent&#8221; papers that focus on impact on Open Science, impact of open access on societal impact, influence of funding on open access citation advantage etc. 
In short, it does some of the &#8220;boundary work&#8221;.</p><p>While I know some users don&#8217;t understand why this feature exists in Undermind as an email alert because they are hyper-focused on their topic, I find many of the papers surfaced this way interesting.</p><p>As our retrieval and ranking systems get better at surfacing adjacency clusters, exploring and clustering boundaries, we should go beyond simple Chat-style replies with top-five-card summaries or even conventional list style rankings of results<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-9" href="#footnote-9" target="_self">9</a>.  What we need are innovative, dedicated features that assist the searcher in learning about the field they are exploring.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee via ko-fi!&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee via ko-fi!</span></a></p><p></p><h2>Conclusion</h2><p>The crude claim collapses on inspection. Poor relevancy ranking that is accidental is not a pedagogical good in itself.</p><p>Topical ranking and pedagogical value can perhaps come apart, particularly for novices who need exposure to topic boundaries, adjacent vocabularies, and the structure of a field. Retrieval is not just a delivery mechanism for known items. It can be part of how a learner forms the map.</p><p>But the conclusion that follows is not a defence of worse ranking. It is that we should stop treating poor ranking as a substitute for thoughtful design. If boundary learning matters, expose adjacent concepts deliberately. If vocabulary formation matters, make semantic neighbours visible. 
If we care about epistemic diversity, promote multiple tools and multiple ways of traversing a literature.</p><p>Poor ranking is a bad proxy for all of that. The honest response is to design for <em>productive friction explicitly,</em> not to hope mediocre retrieval generates it by accident or to use pedagogical reasons as a poor excuse for poor relevancy!</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><p></p><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-1" href="#footnote-anchor-1" class="footnote-number" contenteditable="false" target="_self">1</a><div class="footnote-content"><p>Cognitive load theory</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-2" href="#footnote-anchor-2" class="footnote-number" contenteditable="false" target="_self">2</a><div class="footnote-content"><p>Looking back at how well or badly librarianship has reacted to new tools, I suspect experts worrying about the devaluation of their skills is sometimes part of the unspoken story. The other part of the story relates to a lack of appreciation of how newer tools can provide value without entirely replacing all the features of older tools. 
This will be covered in the third part of my hot-takes series on the history of Google Scholar.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-3" href="#footnote-anchor-3" class="footnote-number" contenteditable="false" target="_self">3</a><div class="footnote-content"><p>In fact, given the explosion of modern search techniques since transformers were invented (compared to before the 2020s, when roughly the same search algorithms were used in academic search), we get extremely different retrieval and ranking results from &#8220;AI search&#8221;, even using the same index. For example, Elicit, Consensus, and Undermind yield very different results despite drawing from roughly the same sources. I will outline my findings from an upcoming presentation at FORCE2026 in a future post.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-4" href="#footnote-anchor-4" class="footnote-number" contenteditable="false" target="_self">4</a><div class="footnote-content"><p><strong>One could argue visible ranking failure</strong> can be pedagogically useful because it reveals the constructed nature of search results. 
In other words, bad ranking is not useful because it retrieves better learning material; it is useful because it exposes the machinery and teaches the user the concept of algorithmic awareness.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-5" href="#footnote-anchor-5" class="footnote-number" contenteditable="false" target="_self">5</a><div class="footnote-content"><p>The <a href="https://journals.sagepub.com/doi/abs/10.1177/0165551515615841">&#8220;Search-as-Learning&#8221; literature</a> clearly says no to this and argues that for learning, the target may not be maximum topical relevance, but optimised epistemic development: enough relevance to avoid junk, enough diversity to expose boundaries, enough friction to force reflection, and enough transparency to reveal mediation. Refer to this <a href="https://ils.unc.edu/~jarguell/UrgoFNTIR2025.pdf">monograph for an introduction</a>.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-6" href="#footnote-anchor-6" class="footnote-number" contenteditable="false" target="_self">6</a><div class="footnote-content"><p>The strongest objection is not that poor ranking is good. It is that relevance ranking and learning are not the same objective. Search-as-learning research suggests that students learn through reformulation, comparison, metacognitive monitoring, and source integration, not simply through exposure to the most topically relevant documents. So the real risk is not that better ranking removes junk; it is that an overly smooth ranking experience may reduce opportunities for reflection, query experimentation, and awareness of algorithmic mediation. The answer is still not worse ranking, but neither is it ranking alone. It is ranking plus scaffolding, contestability, diversity, and explicit prompts to compare how the system has framed the topic. 
</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-7" href="#footnote-anchor-7" class="footnote-number" contenteditable="false" target="_self">7</a><div class="footnote-content"><p>To be fair, whether an irrelevant result is informative or not is highly contextual and not easy to determine sometimes. Similarly, serendipity in information seeking is partly emergent from the searcher&#8217;s context, preparedness, and interpretation, not simply a system property.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-8" href="#footnote-anchor-8" class="footnote-number" contenteditable="false" target="_self">8</a><div class="footnote-content"><p>Note that Undermind's framing &#8212; "cites the seminal works but judged off-topic" &#8212; is doing real work. The user can see why something is adjacent, not just that it is. A black-box adjacency feature would face the same trust problem as poor ranking, only worse, because users would not even see the messy mix. Legibility of the criterion is part of what makes intentional adjacency defensible.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-9" href="#footnote-anchor-9" class="footnote-number" contenteditable="false" target="_self">9</a><div class="footnote-content"><p>It is no surprise, I don&#8217;t agree with Emily M. 
Bender style beliefs that LLMs are &#8220;stochastic parrots&#8221; and hence can never be useful for anything much including search but<a href="https://dl.acm.org/doi/epdf/10.1145/3498366.3505816"> 2020&#8217;s Situating Search</a> is clearly correct that there are many information seeking needs and we need diversity in search tools beyond just conversational interfaces or even ranking lists.</p></div></div>]]></content:encoded></item><item><title><![CDATA[[Hot Take] AI Academic Search and the Missing Middle of Literature Discovery]]></title><description><![CDATA[Is overly focusing on Undergraduate information literacy and evidence synthesis making us underestimate AI academic search tools?]]></description><link>https://aarontay.substack.com/p/ai-academic-search-and-the-missing</link><guid isPermaLink="false">https://aarontay.substack.com/p/ai-academic-search-and-the-missing</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Mon, 25 May 2026 19:17:36 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!80a7!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb1fa6744-ef93-4505-8cb1-927014a1c482_1678x937.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!80a7!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb1fa6744-ef93-4505-8cb1-927014a1c482_1678x937.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!80a7!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb1fa6744-ef93-4505-8cb1-927014a1c482_1678x937.png 424w, 
https://substackcdn.com/image/fetch/$s_!80a7!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb1fa6744-ef93-4505-8cb1-927014a1c482_1678x937.png 848w, https://substackcdn.com/image/fetch/$s_!80a7!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb1fa6744-ef93-4505-8cb1-927014a1c482_1678x937.png 1272w, https://substackcdn.com/image/fetch/$s_!80a7!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb1fa6744-ef93-4505-8cb1-927014a1c482_1678x937.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!80a7!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb1fa6744-ef93-4505-8cb1-927014a1c482_1678x937.png" width="1456" height="813" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/b1fa6744-ef93-4505-8cb1-927014a1c482_1678x937.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:813,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:2541068,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/196200309?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb1fa6744-ef93-4505-8cb1-927014a1c482_1678x937.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!80a7!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb1fa6744-ef93-4505-8cb1-927014a1c482_1678x937.png 424w, https://substackcdn.com/image/fetch/$s_!80a7!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb1fa6744-ef93-4505-8cb1-927014a1c482_1678x937.png 848w, https://substackcdn.com/image/fetch/$s_!80a7!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb1fa6744-ef93-4505-8cb1-927014a1c482_1678x937.png 1272w, https://substackcdn.com/image/fetch/$s_!80a7!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb1fa6744-ef93-4505-8cb1-927014a1c482_1678x937.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" 
stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><em>This post is part of a &#8220;hot takes&#8221; series in which I make sharper claims than I usually do. I do not intend to offend, and I am not trying to tar every librarian with the same brush &#8212; the patterns I describe and perceive may be a function of my own local context. But I am sure some of what I write will resonate. Besides, I think librarianship advances by naming what could be better, not by pretending everything is fine.</em></p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p><strong>TLDR:</strong>  AI search tools may look unimpressive when judged mainly through the two most visible library search frameworks: undergraduate information literacy and evidence synthesis. 
But their strongest current use case may be a third one: ordinary narrative literature reviews also often called Scholarly Discovery, where librarianship&#8217;s voice is less visible than it should be.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee via ko-fi!&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee via ko-fi!</span></a></p><p>I keep running into librarians, in conversation and online, who say they have tried AI search tools and come away unimpressed. They do not really see what the fuss is about.</p><p>Some of this reaction is fair. The category &#8220;AI search&#8221; is broad, and a fair amount of what gets sold under that label is underwhelming.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!sgot!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ed48076-fc66-4f5c-8cfc-ffcbdbbd7059_1256x703.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!sgot!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ed48076-fc66-4f5c-8cfc-ffcbdbbd7059_1256x703.png 424w, https://substackcdn.com/image/fetch/$s_!sgot!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ed48076-fc66-4f5c-8cfc-ffcbdbbd7059_1256x703.png 848w, https://substackcdn.com/image/fetch/$s_!sgot!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ed48076-fc66-4f5c-8cfc-ffcbdbbd7059_1256x703.png 1272w, 
https://substackcdn.com/image/fetch/$s_!sgot!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ed48076-fc66-4f5c-8cfc-ffcbdbbd7059_1256x703.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!sgot!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ed48076-fc66-4f5c-8cfc-ffcbdbbd7059_1256x703.png" width="1256" height="703" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4ed48076-fc66-4f5c-8cfc-ffcbdbbd7059_1256x703.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:703,&quot;width&quot;:1256,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1194504,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/196200309?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ed48076-fc66-4f5c-8cfc-ffcbdbbd7059_1256x703.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!sgot!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ed48076-fc66-4f5c-8cfc-ffcbdbbd7059_1256x703.png 424w, https://substackcdn.com/image/fetch/$s_!sgot!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ed48076-fc66-4f5c-8cfc-ffcbdbbd7059_1256x703.png 848w, 
https://substackcdn.com/image/fetch/$s_!sgot!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ed48076-fc66-4f5c-8cfc-ffcbdbbd7059_1256x703.png 1272w, https://substackcdn.com/image/fetch/$s_!sgot!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ed48076-fc66-4f5c-8cfc-ffcbdbbd7059_1256x703.png 1456w" sizes="100vw"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>At its weakest it runs thin LLM wrappers that translate a natural-language query into a Boolean string and then run it over the same lexical search 
engine underneath. I have previously called this the <a href="https://aarontay.substack.com/p/the-horseless-carriage-of-ai-search">horseless carriage of AI search</a>: using new technology to reproduce the shape of the old system rather than rethinking the system itself. </p><p>Without radically rethinking retrieval and ranking (e.g. <a href="https://aarontay.substack.com/p/why-embedding-vector-search-is-probably">Semantic search via dense embeddings</a>, <a href="https://hornet.dev/blog/this-is-what-agentic-retrieval-looks-like">iterative agentic search</a> etc), the ceiling on improvement will be low.   </p><p>Several library vendors now ship tools of this kind &#8212; Scopus AI, Web of Science Research Assistant, Primo Research Assistant, EBSCOhost Natural Language Search, and others. They use a powerful new technology to reproduce an old artefact, without addressing the ranking-stage problems that make academic search frustrating in the first place<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-1" href="#footnote-1" target="_self">1</a>. If a librarian&#8217;s exposure to &#8220;AI search&#8221; is mostly tools of this sort, writing off the category is understandable.</p><p>But the reaction I want to focus on is different. 
It is the dismissal that extends even to the better AI search tools: <a href="http://undermind.ai">Undermind</a>, <a href="http://elicit.com">Elicit</a>, <a href="https://asta.allen.ai/discover?redirect_from=paper-finder">Asta Paper Finder</a>, <a href="http://Consensus.app">Consensus</a>, and others that are not simply trying to make Boolean search friendlier but are attempting more radical changes to retrieval and ranking.</p><blockquote><p>I will keep talking about &#8220;better AI search tools&#8221; throughout this essay and you might be wondering what I mean, since there are <a href="https://aarontay.substack.com/p/what-do-we-actually-mean-by-ai-powered">many types of Academic AI search</a> with different &#8220;AI&#8221; techniques and architectures used to accomplish different functions. </p><p>Clearly, systems ONLY based on <a href="https://aarontay.substack.com/p/the-horseless-carriage-of-ai-search">horseless carriage AI search techniques</a> are unlikely to do much better, but can we say anything more positive here?</p><p>While there are no guarantees, I would suggest that academic AI search tools that fall into the <a href="https://aarontay.substack.com/p/why-i-think-academic-deep-research#:~:text=Top%2Dright%20(Deep,evaluate%20relevancy%20well.">&#8220;Deep Search&#8221; and &#8220;Deep Research&#8221; types of search tools</a> should, more often than not, give clearly superior retrieval and ranking for &#8220;difficult queries&#8221; compared to traditional Boolean retrieval with basic TF-IDF/BM25 ranking. 
But if you need one tool to point at that I consider a &#8220;better AI search tool&#8221; - I would consider Undermind.ai as an example<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-2" href="#footnote-2" target="_self">2</a>.</p></blockquote><p>In my own testing, <a href="https://aarontay.substack.com/p/better-ai-search-rubrics-roles-gates#:~:text=Still%2C%20I%20want,return%20something%20plausible.">particularly for difficult queries</a>, the difference is often visible in the first screen of results: the better AI search tools place relevant work high in the ranking, while conventional databases often require more query reformulation and screening before comparable papers appear. </p><p>For example, I recently ran a study on reproducibility, running the same query five times across multiple AI search engines. It was not even meant to compare AI search engines&#8217; relevancy, but even with a broad query that had 200+ possible relevant results, only Undermind maintained high precision down to rank 50. </p><p>Other respected AI search tools could barely manage this for the top 10 to 20, showing the variance in performance. 
For &#8220;hard queries&#8221; the difference was even more stark between AI search tools and conventional databases.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Pv09!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3e90d197-27b2-4d11-8e20-7431b9743a22_1351x759.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Pv09!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3e90d197-27b2-4d11-8e20-7431b9743a22_1351x759.png 424w, https://substackcdn.com/image/fetch/$s_!Pv09!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3e90d197-27b2-4d11-8e20-7431b9743a22_1351x759.png 848w, https://substackcdn.com/image/fetch/$s_!Pv09!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3e90d197-27b2-4d11-8e20-7431b9743a22_1351x759.png 1272w, https://substackcdn.com/image/fetch/$s_!Pv09!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3e90d197-27b2-4d11-8e20-7431b9743a22_1351x759.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Pv09!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3e90d197-27b2-4d11-8e20-7431b9743a22_1351x759.png" width="1351" height="759" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/3e90d197-27b2-4d11-8e20-7431b9743a22_1351x759.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:759,&quot;width&quot;:1351,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1242861,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/196200309?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3e90d197-27b2-4d11-8e20-7431b9743a22_1351x759.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Pv09!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3e90d197-27b2-4d11-8e20-7431b9743a22_1351x759.png 424w, https://substackcdn.com/image/fetch/$s_!Pv09!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3e90d197-27b2-4d11-8e20-7431b9743a22_1351x759.png 848w, https://substackcdn.com/image/fetch/$s_!Pv09!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3e90d197-27b2-4d11-8e20-7431b9743a22_1351x759.png 1272w, https://substackcdn.com/image/fetch/$s_!Pv09!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3e90d197-27b2-4d11-8e20-7431b9743a22_1351x759.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p style="text-align: center;"><em>The diagram above is just illustrative</em></p><p>I would not be as confident in this if it were only my own assessment, but feedback from PhD students and faculty has been<em> overwhelmingly positive with continued heavy sustained use of Undermind.ai</em><a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-3" href="#footnote-3" target="_self">3</a>. Comments like &#8220;if you do not renew the subscription, I will pay for it myself&#8221; are common. </p><p>To be clear, we are not talking about Cochrane-grade recall here, and these tools do not exhaust the literature. 
Their strength is not formal exhaustiveness, but top-N relevance: for focused topics, they often put more useful papers into the first 10, 20, or 50 results than conventional database searches.</p><p>But this post isn&#8217;t just about Undermind.ai; in my view there are quite a few tools (pretty much any type of Deep Search or Deep Research) that are almost as good.</p><p>So the question is: given that the better AI search tools often deliver much stronger early precision and better practical discovery for focused scholarly questions, especially when judged by the relevance of the top 10 to 50 results, and many researchers plainly value this, why do some librarians still not see it?</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!AsXE!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cce51ec-313b-4315-9325-42b03742ac7c_1186x609.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!AsXE!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cce51ec-313b-4315-9325-42b03742ac7c_1186x609.png 424w, https://substackcdn.com/image/fetch/$s_!AsXE!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cce51ec-313b-4315-9325-42b03742ac7c_1186x609.png 848w, https://substackcdn.com/image/fetch/$s_!AsXE!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cce51ec-313b-4315-9325-42b03742ac7c_1186x609.png 1272w, 
https://substackcdn.com/image/fetch/$s_!AsXE!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cce51ec-313b-4315-9325-42b03742ac7c_1186x609.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!AsXE!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cce51ec-313b-4315-9325-42b03742ac7c_1186x609.png" width="1186" height="609" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/2cce51ec-313b-4315-9325-42b03742ac7c_1186x609.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:609,&quot;width&quot;:1186,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:899096,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/196200309?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cce51ec-313b-4315-9325-42b03742ac7c_1186x609.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!AsXE!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cce51ec-313b-4315-9325-42b03742ac7c_1186x609.png 424w, https://substackcdn.com/image/fetch/$s_!AsXE!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cce51ec-313b-4315-9325-42b03742ac7c_1186x609.png 848w, 
https://substackcdn.com/image/fetch/$s_!AsXE!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cce51ec-313b-4315-9325-42b03742ac7c_1186x609.png 1272w, https://substackcdn.com/image/fetch/$s_!AsXE!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2cce51ec-313b-4315-9325-42b03742ac7c_1186x609.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Leaving aside <a href="https://aarontay.substack.com/p/what-do-we-actually-mean-by-ai-powered">the usual anti-AI reasons</a> and 
focusing on the effectiveness angle, my best guess is that librarians who teach or support search often evaluate AI search tools through one of two existing professional lenses: undergraduate information literacy and evidence synthesis. Neither lens is well-suited to what the better AI search tools currently do best. The use case where these tools genuinely shine, the ordinary narrative review, sits in a third space that the profession has generally paid less attention to.  </p><div class="captioned-button-wrap" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/ai-academic-search-and-the-missing?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="CaptionedButtonToDOM"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! This post is public so feel free to share it.</p></div><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/ai-academic-search-and-the-missing?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://aarontay.substack.com/p/ai-academic-search-and-the-missing?utm_source=substack&utm_medium=email&utm_content=share&action=share"><span>Share</span></a></p></div><h3>Lens 1: Information literacy for undergraduates</h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!dt4c!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f33d9be-9fae-45ca-bf26-ff25d91fc5b8_1244x706.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" 
srcset="https://substackcdn.com/image/fetch/$s_!dt4c!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f33d9be-9fae-45ca-bf26-ff25d91fc5b8_1244x706.png 424w, https://substackcdn.com/image/fetch/$s_!dt4c!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f33d9be-9fae-45ca-bf26-ff25d91fc5b8_1244x706.png 848w, https://substackcdn.com/image/fetch/$s_!dt4c!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f33d9be-9fae-45ca-bf26-ff25d91fc5b8_1244x706.png 1272w, https://substackcdn.com/image/fetch/$s_!dt4c!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f33d9be-9fae-45ca-bf26-ff25d91fc5b8_1244x706.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!dt4c!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f33d9be-9fae-45ca-bf26-ff25d91fc5b8_1244x706.png" width="1244" height="706" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/6f33d9be-9fae-45ca-bf26-ff25d91fc5b8_1244x706.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:706,&quot;width&quot;:1244,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:954370,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/196200309?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f33d9be-9fae-45ca-bf26-ff25d91fc5b8_1244x706.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" 
class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!dt4c!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f33d9be-9fae-45ca-bf26-ff25d91fc5b8_1244x706.png 424w, https://substackcdn.com/image/fetch/$s_!dt4c!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f33d9be-9fae-45ca-bf26-ff25d91fc5b8_1244x706.png 848w, https://substackcdn.com/image/fetch/$s_!dt4c!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f33d9be-9fae-45ca-bf26-ff25d91fc5b8_1244x706.png 1272w, https://substackcdn.com/image/fetch/$s_!dt4c!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f33d9be-9fae-45ca-bf26-ff25d91fc5b8_1244x706.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" 
stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The first lens is the information literacy (IL) lens, often focused on undergraduate learning.</p><p>Information literacy specialists will rightly remind me that IL for undergraduates is not the reductive &#8220;teach students to find five peer-reviewed papers for an assignment.&#8221; At its best, IL teaching helps students understand how information systems work, how authority is constructed, how disciplinary knowledge is produced, how databases and search engines shape what becomes visible, and how inquiry develops over time. Searching is not just a mechanical act of retrieval (Searching as Strategic Exploration!). It is part of learning how knowledge is organised, contested, and evaluated.</p><p>That said, the stereotype exists for a reason. A large amount of undergraduate IL instruction is still tied to assignment support: helping students find a handful of credible scholarly sources for essays. The librarian may want to teach richer concepts, but the immediate student need is often narrow.</p><p>This is exactly the use case where higher precision and recall do not matter much. A student writing a 2,000-word essay does not need exhaustive recall. They need enough credible sources on a common topic (of which there are many) to support a basic argument, and almost any decent academic database can supply that. JSTOR, ProQuest, EBSCOhost, Scopus, Google Scholar, or the library discovery layer will usually produce something usable. Better ranking helps, but rarely transforms the outcome.  
</p><p>In short, if the dominant teaching use case is helping undergraduates find &#8220;some good enough sources,&#8221; then the value of a tool that produces a much stronger top-10 or top-20 ranked list may not be obvious. The existing tools already clear the bar.</p><h4>The pedagogical argument</h4><p>There&#8217;s a deeper issue. </p><p>If the goal is simply to help students obtain relevant sources quickly, then better ranking is an obvious win. But if, as an information literacy librarian, your goal is to help students understand the process of searching, e.g. how keywords fail, how databases differ, how controlled vocabularies work<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-4" href="#footnote-4" target="_self">4</a>, then an AI tool that quietly produces a good ranked list with no effort from the searcher is <em>arguably even worse for this purpose!</em></p><p>From that perspective, poor relevance ranking is not really a bug to be designed away. In a sense it is closer to a feature, because it creates the conditions in which these skills become necessary and therefore teachable. A student whose first search returns exactly what they want does not learn anything transferable about searching. A tool that does the work for the user implicitly devalues the skills the librarian is trying to develop, and so its strengths might register as threats rather than wins.</p><p>After all, friction is pedagogically useful, and one could even argue that better search results remove friction! </p><blockquote><p>At this point, we can consider whether all friction is useful for learning, and whether the friction removed by better search ranking is &#8220;useful friction&#8221;. My next post will address this interesting topic.</p></blockquote><p>This orientation may also help explain a pattern in some librarian-led AI search evaluation frameworks, often designed by IL librarians. 
Retrieval effectiveness tends to be folded into a long list of weighted criteria alongside ease of use, transparency, accessibility, currency, and ethics. As I have argued in a <a href="https://aarontay.substack.com/p/better-ai-search-rubrics-roles-gates">recent post on AI search rubrics</a>, retrieval should instead be treated as a gating criterion: if a tool cannot find the relevant literature, the other criteria do not rescue it, because surfacing relevant literature is the thing the tool exists to do.</p><p> </p><h3>Lens 2: Evidence Synthesis</h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Qrgw!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39a339f6-1124-4f17-a765-f339a30c057c_1252x706.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Qrgw!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39a339f6-1124-4f17-a765-f339a30c057c_1252x706.png 424w, https://substackcdn.com/image/fetch/$s_!Qrgw!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39a339f6-1124-4f17-a765-f339a30c057c_1252x706.png 848w, https://substackcdn.com/image/fetch/$s_!Qrgw!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39a339f6-1124-4f17-a765-f339a30c057c_1252x706.png 1272w, https://substackcdn.com/image/fetch/$s_!Qrgw!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39a339f6-1124-4f17-a765-f339a30c057c_1252x706.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!Qrgw!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39a339f6-1124-4f17-a765-f339a30c057c_1252x706.png" width="1252" height="706" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/39a339f6-1124-4f17-a765-f339a30c057c_1252x706.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:706,&quot;width&quot;:1252,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1451879,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/196200309?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39a339f6-1124-4f17-a765-f339a30c057c_1252x706.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Qrgw!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39a339f6-1124-4f17-a765-f339a30c057c_1252x706.png 424w, https://substackcdn.com/image/fetch/$s_!Qrgw!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39a339f6-1124-4f17-a765-f339a30c057c_1252x706.png 848w, https://substackcdn.com/image/fetch/$s_!Qrgw!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39a339f6-1124-4f17-a765-f339a30c057c_1252x706.png 1272w, https://substackcdn.com/image/fetch/$s_!Qrgw!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39a339f6-1124-4f17-a765-f339a30c057c_1252x706.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The second lens is evidence synthesis: systematic reviews, scoping reviews, and meta-analyses. From this vantage point, the gold standard is near-exhaustive recall with documented and reproducible search strategies. Most AI search tools, even the best ones, do not deliver this by design<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-5" href="#footnote-5" target="_self">5</a>.</p><blockquote><p>Why not just ask an LLM for a Boolean search strategy? 
<a href="https://app.undermind.ai/report/8f6940b18b8a7c8bbf5ee1b080dde713fe492b976f0be4c8ebfaa15235e42a24">Plenty of literature since 2023</a> shows that prompting LLMs to generate Boolean strings produces poor results. <a href="https://arxiv.org/abs/2602.00005">Fine-tuning helps moderately</a>. My current view is that a better way to approach acceptable quality is to give an agentic LLM access to PubMed and the MeSH browser and let it pilot-test the search the way a human searcher does. You can see my early attempt at <a href="http://ACoAAADydNkB8cFBZ48tGuFjE4yHqQ6N6mBWEyE">building a Claude skill</a> along these lines.</p></blockquote><p>Beyond that, LLM-driven search is not deterministic, and you cannot publish a systematic review whose search step is &#8220;I asked Undermind.&#8221; From this lens, AI search is at best a supplement and at worst a distraction.</p><blockquote><p>There are of course specialised AI search tools designed specifically for evidence synthesis. On one hand are those built on pre-LLM machine learning techniques, such as <a href="https://asreview.nl/">ASReview</a> and <a href="https://www.covidence.org/">Covidence</a>, which rely mostly on active learning and supervised classifiers for screening prioritisation. </p><p>On the other hand, a growing number of LLM-native entrants have appeared, including those highlighted in <a href="https://www.cochrane.org/about-us/news/cochrane-announces-selected-ai-tools-innovative-platform-study">Cochrane's recent announcement of selected AI tools for its innovative platform study</a>. The boundary is blurring, however. Established players like Covidence, Rayyan, and DistillerSR have been retrofitting LLM features onto what were originally classical ML workflows.</p><p>These newer LLM-native tools are very new and largely untested. 
Within the systematic review community, established tools like Rayyan and Covidence are well known, but the recent LLM-first entrants remain unfamiliar even to most specialists. <a href="https://elicit.com/">Elicit</a> is perhaps the most mainstream LLM-native tool to enter this space, and recently <a href="https://elicit.com/blog/systematic-review-for-prisma-2020">claimed support for "PRISMA 2020 guidelines, making it reproducible, traceable, and auditable at every step"</a><a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-6" href="#footnote-6" target="_self">6</a>. </p><p>But notice what Elicit and similar tools actually do. Even they apply LLMs mostly to screening, deduplication, data extraction, and maybe risk-of-bias assessment, while leaving the actual search step to standard Boolean queries on PubMed. That tells us something important: high-recall search is still a hard problem for modern retrieval techniques<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-7" href="#footnote-7" target="_self">7</a>.</p></blockquote><p>This is not irrational. For evidence synthesis, high recall is non-negotiable. 
If your professional frame is systematic review support, then a tool with excellent precision but uncertain recall will naturally look insufficient.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!p1aR!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d7b478-fa14-4846-a88f-ec461063bd36_1249x706.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!p1aR!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d7b478-fa14-4846-a88f-ec461063bd36_1249x706.png 424w, https://substackcdn.com/image/fetch/$s_!p1aR!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d7b478-fa14-4846-a88f-ec461063bd36_1249x706.png 848w, https://substackcdn.com/image/fetch/$s_!p1aR!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d7b478-fa14-4846-a88f-ec461063bd36_1249x706.png 1272w, https://substackcdn.com/image/fetch/$s_!p1aR!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d7b478-fa14-4846-a88f-ec461063bd36_1249x706.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!p1aR!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d7b478-fa14-4846-a88f-ec461063bd36_1249x706.png" width="1249" height="706" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c6d7b478-fa14-4846-a88f-ec461063bd36_1249x706.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:706,&quot;width&quot;:1249,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:848435,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/196200309?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d7b478-fa14-4846-a88f-ec461063bd36_1249x706.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!p1aR!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d7b478-fa14-4846-a88f-ec461063bd36_1249x706.png 424w, https://substackcdn.com/image/fetch/$s_!p1aR!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d7b478-fa14-4846-a88f-ec461063bd36_1249x706.png 848w, https://substackcdn.com/image/fetch/$s_!p1aR!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d7b478-fa14-4846-a88f-ec461063bd36_1249x706.png 1272w, https://substackcdn.com/image/fetch/$s_!p1aR!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d7b478-fa14-4846-a88f-ec461063bd36_1249x706.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>So if these two lenses are all you have, AI search tools look unimpressive twice over. They are unnecessary, or even harmful, for the basic undergraduate case. 
They are not good enough for the systematic review case.</p><p> </p><h2>A view from outside the profession</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!ry1t!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a2c441e-9d22-44ff-ba82-6c13eb93c860_774x458.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!ry1t!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a2c441e-9d22-44ff-ba82-6c13eb93c860_774x458.png 424w, https://substackcdn.com/image/fetch/$s_!ry1t!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a2c441e-9d22-44ff-ba82-6c13eb93c860_774x458.png 848w, https://substackcdn.com/image/fetch/$s_!ry1t!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a2c441e-9d22-44ff-ba82-6c13eb93c860_774x458.png 1272w, https://substackcdn.com/image/fetch/$s_!ry1t!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a2c441e-9d22-44ff-ba82-6c13eb93c860_774x458.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!ry1t!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a2c441e-9d22-44ff-ba82-6c13eb93c860_774x458.png" width="774" height="458" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/7a2c441e-9d22-44ff-ba82-6c13eb93c860_774x458.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:458,&quot;width&quot;:774,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:484263,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/196200309?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a2c441e-9d22-44ff-ba82-6c13eb93c860_774x458.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!ry1t!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a2c441e-9d22-44ff-ba82-6c13eb93c860_774x458.png 424w, https://substackcdn.com/image/fetch/$s_!ry1t!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a2c441e-9d22-44ff-ba82-6c13eb93c860_774x458.png 848w, https://substackcdn.com/image/fetch/$s_!ry1t!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a2c441e-9d22-44ff-ba82-6c13eb93c860_774x458.png 1272w, https://substackcdn.com/image/fetch/$s_!ry1t!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a2c441e-9d22-44ff-ba82-6c13eb93c860_774x458.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>A recent <a href="https://youtu.be/vzMeBNwSd2Y">video by John Frechette, the CEO of Moara</a> is worth watching here, partly because it reaches conclusions similar to mine but from an outsider&#8217;s vantage point. He makes two observations, both of which I think are largely correct, and the second of which I expect more librarians to push back on.</p><blockquote><p>You might suspect bias as he runs a commercial AI research platform. But <a href="http://moara.io">Moara</a> is not mainly a search engine. It is closer to a next generation reference manager or an AI-infused evidence synthesis workspace, somewhat like Covidence with more aggressive LLM use, helping researchers collect, screen, and synthesise sources from anywhere: Google Scholar, Undermind, Claude, conventional databases, PDFs, reference managers. 
In that sense, Moara is source-agnostic, and John has little incentive to favour one search tool over any other (he tends to praise both Undermind and Claude search outright in his demos).</p></blockquote><p>First, he criticises the standard framing of literature search in some libguides as &#8220;pick a database, run your search, you are done.&#8221; He is right that this is misleading. Top-10 and top-20 overlap across major academic search engines is much smaller than this framing implies, and evidence synthesis methodology has long acknowledged that no single source has comprehensive coverage of any non-trivial broad topic. Though in fairness, many libguides are aimed at undergraduates who are not doing the level of formal review John has in mind.</p><p>Second, and more controversially, he notes that many university-recommended discipline-specific databases produced worse results than Google Scholar or Undermind, and that even IDEAS, despite his topic being in economics, returned irrelevant results past the first ten hits. <em>Some librarians will take offence at this. I will say it plainly: I think he is right.</em></p><p>For many difficult, exploratory, or poorly lexicalised scholarly queries, the top-ranked results in conventional academic databases can be noticeably weaker than those from Google Scholar or newer deep-search tools like Undermind, Asta Paper Finder, or Consensus. This is not a knock on the metadata quality of those discipline-specific databases, which is often excellent. But ranking is a separate problem from coverage, and ranking is increasingly where the bottleneck sits. Discipline-specific databases optimised for Boolean retrieval over rich metadata were not built around the powerful semantic or agentic/iterative pipelines that modern AI search uses, and it shows.</p><p>To his credit, John does not argue you should ditch every database for a single AI search tool, no matter how good. He explicitly says one source is never enough. 
The point is not &#8220;AI search wins, traditional databases lose.&#8221; The point is that ranking quality varies, and a tool that reliably surfaces relevant work in its top 10/20/50 is doing something traditional databases often fail at.</p><p>  </p><h2>The missing middle: narrative reviews</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!HJO0!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad77c82a-b9bb-4099-aef4-99c47204703b_1248x710.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!HJO0!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad77c82a-b9bb-4099-aef4-99c47204703b_1248x710.png 424w, https://substackcdn.com/image/fetch/$s_!HJO0!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad77c82a-b9bb-4099-aef4-99c47204703b_1248x710.png 848w, https://substackcdn.com/image/fetch/$s_!HJO0!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad77c82a-b9bb-4099-aef4-99c47204703b_1248x710.png 1272w, https://substackcdn.com/image/fetch/$s_!HJO0!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad77c82a-b9bb-4099-aef4-99c47204703b_1248x710.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!HJO0!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad77c82a-b9bb-4099-aef4-99c47204703b_1248x710.png" width="1248" height="710" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ad77c82a-b9bb-4099-aef4-99c47204703b_1248x710.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:710,&quot;width&quot;:1248,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1205306,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/196200309?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad77c82a-b9bb-4099-aef4-99c47204703b_1248x710.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!HJO0!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad77c82a-b9bb-4099-aef4-99c47204703b_1248x710.png 424w, https://substackcdn.com/image/fetch/$s_!HJO0!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad77c82a-b9bb-4099-aef4-99c47204703b_1248x710.png 848w, https://substackcdn.com/image/fetch/$s_!HJO0!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad77c82a-b9bb-4099-aef4-99c47204703b_1248x710.png 1272w, https://substackcdn.com/image/fetch/$s_!HJO0!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad77c82a-b9bb-4099-aef4-99c47204703b_1248x710.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>What both the information literacy and evidence synthesis lenses can miss is probably the most common literature search scenario in academia: the ordinary scholarly literature review, often known as scholarly discovery.</p><p>Most academics writing the literature review section of a paper, a thesis, a grant application, or a book chapter are not doing systematic reviews. </p><p>Don&#8217;t get me wrong, they still need to demonstrate command of the relevant literature, identify the key debates and findings, and situate their own contribution. 
They want practical coverage and recall: enough confidence that they have not missed the main debates, methods, authors, and findings, combined with high precision because their time is finite and reading irrelevant papers is expensive.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!p-z9!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4c941250-546f-43dc-910b-179a3d859981_1668x943.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!p-z9!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4c941250-546f-43dc-910b-179a3d859981_1668x943.png 424w, https://substackcdn.com/image/fetch/$s_!p-z9!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4c941250-546f-43dc-910b-179a3d859981_1668x943.png 848w, https://substackcdn.com/image/fetch/$s_!p-z9!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4c941250-546f-43dc-910b-179a3d859981_1668x943.png 1272w, https://substackcdn.com/image/fetch/$s_!p-z9!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4c941250-546f-43dc-910b-179a3d859981_1668x943.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!p-z9!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4c941250-546f-43dc-910b-179a3d859981_1668x943.png" width="1456" height="823" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4c941250-546f-43dc-910b-179a3d859981_1668x943.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:823,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1312016,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/196200309?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4c941250-546f-43dc-910b-179a3d859981_1668x943.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!p-z9!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4c941250-546f-43dc-910b-179a3d859981_1668x943.png 424w, https://substackcdn.com/image/fetch/$s_!p-z9!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4c941250-546f-43dc-910b-179a3d859981_1668x943.png 848w, https://substackcdn.com/image/fetch/$s_!p-z9!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4c941250-546f-43dc-910b-179a3d859981_1668x943.png 1272w, https://substackcdn.com/image/fetch/$s_!p-z9!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4c941250-546f-43dc-910b-179a3d859981_1668x943.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This is exactly the niche where the better AI search tools deliver the most value. Undermind, Asta Paper Finder, and Consensus (either alone or more likely in combination with other tools) in my testing tend to produce a tightly relevant result set with strong precision in the top ranks, at the cost of not exhausting the long tail. For a narrative review, that tradeoff is excellent. For a systematic review, it is insufficient on its own. For a freshman essay, it is overkill.</p><p>When I look at which researchers most enthusiastically adopt these tools, it is overwhelmingly people doing narrative reviews. That is not a coincidence.</p><h2>The missing or less visible third camp</h2><p>I am not saying no librarian cares about this use case (I exist!). 
The line between supporting &#8220;undergraduates finding 5 peer-reviewed articles&#8221; and supporting researchers on capstone or thesis work is thin, and plenty of academic librarians do both. There is a long history of domain-informed, researcher-facing discovery support: the subject specialist (or Reference librarian or Digital Scholarship librarian) helping a researcher navigate a field, identify important work, trace debates, follow citations, recognise key authors, and avoid obvious blind spots. That kind of support will definitely benefit from a strong AI search tool along these lines.</p><p>But my thesis is that in the librarian profession today, search support has become most publicly legible and concentrated in two areas<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-8" href="#footnote-8" target="_self">8</a>. On one side is undergraduate IL. On the other is evidence synthesis, especially in health sciences. Between them sits the ordinary working researcher: the faculty member, PhD student, postdoc, policy researcher, or grant writer who is not doing a systematic review, but still needs better literature discovery than a basic database search provides.</p><p>If librarians do not make themselves visible in that space, researchers will not wait (they already aren&#8217;t). They will use Undermind, Elicit, Consensus, Asta Paper Finder<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-9" href="#footnote-9" target="_self">9</a>, Google Scholar, Claude, ChatGPT, Semantic Scholar, Research Rabbit, Connected Papers, citation alerts, PDFs from colleagues, and whatever else works. They will build their own messy discovery workflows, with or without us.</p><p>A renewed third camp would not <a href="https://aarontay.substack.com/p/were-good-at-search-just-not-the">treat AI search as magic</a>. 
People in this camp would also not dismiss it because it fails systematic review standards or complicates undergraduate pedagogy. They would evaluate these tools the way subject specialists have always evaluated search tools: by asking whether they can surface important, relevant, and useful literature for real research questions. That camp would be willing to say:</p><ul><li><p>An AI search tool can be imperfect and still useful.</p></li><li><p>A tool can be unsuitable for systematic reviews and still valuable for researchers.</p></li><li><p>A tool can lack full transparency and still deserve attention if its retrieval performance is strong.</p></li><li><p>A tool should not be recommended just because it is easy to use, ethical, accessible, or institutionally licensed if it has sub-par retrieval ranking.</p></li><li><p><em>A tool should first be judged by whether it finds relevant literature for the task at hand. Only after that should we ask the other questions.</em></p></li></ul><p>This is not an argument for ignoring privacy, ethics, accessibility, transparency, or sustainability. Those matter. But they should not be used to avoid the retrieval question. If a search tool does not search well, it has failed at its primary task.</p><p>The deeper point is not that librarianship has never occupied this middle territory. It has. The point is that this role needs to become more visible again in the age of AI search. The third camp does not need to be invented from scratch. 
It needs to be recovered, updated, and have a larger voice at the table.</p><p>     </p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee via ko-fi!&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee via ko-fi!</span></a></p><p></p><h2>Conclusion</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!4Dbh!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b78f836-d508-4caf-89b9-e9d1c2ec192f_1055x1491.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!4Dbh!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b78f836-d508-4caf-89b9-e9d1c2ec192f_1055x1491.png 424w, https://substackcdn.com/image/fetch/$s_!4Dbh!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b78f836-d508-4caf-89b9-e9d1c2ec192f_1055x1491.png 848w, https://substackcdn.com/image/fetch/$s_!4Dbh!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b78f836-d508-4caf-89b9-e9d1c2ec192f_1055x1491.png 1272w, https://substackcdn.com/image/fetch/$s_!4Dbh!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b78f836-d508-4caf-89b9-e9d1c2ec192f_1055x1491.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!4Dbh!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b78f836-d508-4caf-89b9-e9d1c2ec192f_1055x1491.png" width="1055" height="1491" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/7b78f836-d508-4caf-89b9-e9d1c2ec192f_1055x1491.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1491,&quot;width&quot;:1055,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1349810,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/196200309?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b78f836-d508-4caf-89b9-e9d1c2ec192f_1055x1491.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!4Dbh!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b78f836-d508-4caf-89b9-e9d1c2ec192f_1055x1491.png 424w, https://substackcdn.com/image/fetch/$s_!4Dbh!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b78f836-d508-4caf-89b9-e9d1c2ec192f_1055x1491.png 848w, https://substackcdn.com/image/fetch/$s_!4Dbh!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b78f836-d508-4caf-89b9-e9d1c2ec192f_1055x1491.png 1272w, https://substackcdn.com/image/fetch/$s_!4Dbh!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b78f836-d508-4caf-89b9-e9d1c2ec192f_1055x1491.png 
1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>To summarise the use cases:</p><ul><li><p><strong>Freshman undergraduate work</strong>: mid-to-high precision, recall does not need to be high. Almost any database with the right coverage will do.</p></li><li><p><strong>Evidence synthesis</strong>: high recall is non-negotiable, and you accept whatever precision you can get. Multiple sources, documented strategies, traditional databases plus maybe AI tools as supplements.</p></li><li><p><strong>Narrative reviews</strong>: moderate recall for the time spent, high early precision, and strong top-ranked relevance. 
This is where the better AI search tools sit, and it is the use case where librarian voices are thinnest.</p></li></ul><p>The smarter evidence synthesis librarians have already figured out that there is nothing preventing them from using Undermind as one source among many in a multi-source strategy, and I have seen several publicly endorse this approach. That is exactly right. But the deeper move the profession still needs to make is to recognise that the narrative review may be a use case underserved by the loudest professional voices&#8230;.</p><div class="captioned-button-wrap" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/ai-academic-search-and-the-missing?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="CaptionedButtonToDOM"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! This post is public so feel free to share it.</p></div><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/ai-academic-search-and-the-missing?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://aarontay.substack.com/p/ai-academic-search-and-the-missing?utm_source=substack&utm_medium=email&utm_content=share&action=share"><span>Share</span></a></p></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-1" href="#footnote-anchor-1" class="footnote-number" contenteditable="false" target="_self">1</a><div class="footnote-content"><p>To be fair, some of these tools don&#8217;t <em>just</em> use LLM to generate nested Boolean, but also do hybrid search and powerful reranking systems (e.g. 
see my <a href="https://katinamagazine.org/content/article/reviews/2025/deep-dive-into-three-ai-academic-search-tools">reviews of Scopus AI, Primo Research Assistant</a>), which can lead to bigger improvements, but in general quite a few tools rely solely or mainly on an LLM to generate Boolean search strings, which leaves limited room for improvement.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-2" href="#footnote-anchor-2" class="footnote-number" contenteditable="false" target="_self">2</a><div class="footnote-content"><p>I know it sounds like I am gushing too much about Undermind.ai. <em>But it is good</em>. Some other data points. <a href="https://bsky.app/profile/aarontay.bsky.social/post/3mf5pplbivk2t">Farhad Shokraneh, a highly respected evidence synthesis expert, has praised Undermind many times in his webinars for exploratory search</a>. So has <a href="https://www.youtube.com/watch?v=W_DylhnBR30">John Frechette, CEO of Moara</a>. Most independent testing of AI search tools for pure relevancy which I have seen (which unfortunately tends to be rare and often of somewhat poor quality) shows Undermind on top (<a href="https://www.researchgate.net/publication/396120553_Do_AI_research_assistants_live_up_to_their_hype_An_Exploratory_Study_of_Some_Freely_Available_Tools">here</a>,<a href="https://bsky.app/profile/aarontay.bsky.social/post/3mf5pplbivk2t"> here</a>, <a href="https://www.tandfonline.com/doi/abs/10.1080/15424065.2025.2546052">here</a>) or, if not, second (if the tester has a dog in the fight, e.g. <a href="https://elicit.com/blog/elicit-reports-eval/">here</a>, <a href="https://publications.mpi-cbg.de/Jain_2024_8866.pdf#page=1.87">here</a>). It has weaknesses of course, e.g. 
its index covers only articles, so even Primo Research Assistant can be competitive if the test set query requires non-scholarly articles and/or <a href="https://bsky.app/profile/aarontay.bsky.social/post/3mf4qdvm5os2t">Claude can beat it by finding relevant grey literature.</a></p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-3" href="#footnote-anchor-3" class="footnote-number" contenteditable="false" target="_self">3</a><div class="footnote-content"><p>In case you are wondering, they (faculty and PhD students) do not react this way to all AI search tools (and we trialed a lot from 2024-2025).</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-4" href="#footnote-anchor-4" class="footnote-number" contenteditable="false" target="_self">4</a><div class="footnote-content"><p>When I demo search tools, I don&#8217;t prep my queries in advance much. But I am not above showing certain queries, knowing that they typically give me opportunities to show off other features. In theory, a very good search result will reduce such opportunities.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-5" href="#footnote-anchor-5" class="footnote-number" contenteditable="false" target="_self">5</a><div class="footnote-content"><p>It seems to me that the traditional systematic review method &#8212; search broadly with Boolean strategies, within reason, then screen the retrieved set &#8212; remains hard to beat for high-recall evidence identification. It is essentially a controlled brute-force approach: instead of trusting the retrieval system to decide what matters, it shifts the burden to transparent over-retrieval and human screening.</p><p>In theory, advanced agentic search might match or beat it if you were willing to set aside reproducibility and interpretability.  
</p><p>The deeper issue is that the main information retrieval field is not really working on this problem as much. <a href="https://x.com/lateinteraction/status/2043053506504925588">Mainstream IR evaluation today is more focused on multi-hop QA and hard needle-in-haystack benchmarks like BEIR, HotpotQA, and BrowseComp plus, all of which reward finding the one document that answers the query rather than finding everything on a topic.</a>  </p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-6" href="#footnote-anchor-6" class="footnote-number" contenteditable="false" target="_self">6</a><div class="footnote-content"><p>Of course, PRISMA 2020 is a reporting guideline, not a search methodology&#8230;..</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-7" href="#footnote-anchor-7" class="footnote-number" contenteditable="false" target="_self">7</a><div class="footnote-content"><p>See footnote 5</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-8" href="#footnote-anchor-8" class="footnote-number" contenteditable="false" target="_self">8</a><div class="footnote-content"><p>I have the impression my blog is read mainly by information literacy librarians, librarians/researchers into evidence synthesis and the odd Library Systems person. Workshops I have conducted are about 50-50 in the first two camps.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-9" href="#footnote-anchor-9" class="footnote-number" contenteditable="false" target="_self">9</a><div class="footnote-content"><p>Two weeks after AI PaperFinder launched, a faculty member was telling me he was already using it because he had heard from his peers that it was good. 
He&#8217;s an exception, an early adopter, but we should not underestimate how fast good research tools are adopted via word of mouth without librarians even hearing about them.</p></div></div>]]></content:encoded></item><item><title><![CDATA[Better AI Search Rubrics: Roles, Gates, and Retrieval Tests]]></title><description><![CDATA[Some suggestions on how to construct AI search evaluation frameworks]]></description><link>https://aarontay.substack.com/p/better-ai-search-rubrics-roles-gates</link><guid isPermaLink="false">https://aarontay.substack.com/p/better-ai-search-rubrics-roles-gates</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Wed, 29 Apr 2026 17:01:02 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!0iE4!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F971676cb-beff-4206-a141-17ded15d575c_1678x937.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!0iE4!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F971676cb-beff-4206-a141-17ded15d575c_1678x937.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!0iE4!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F971676cb-beff-4206-a141-17ded15d575c_1678x937.png 424w, https://substackcdn.com/image/fetch/$s_!0iE4!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F971676cb-beff-4206-a141-17ded15d575c_1678x937.png 848w, 
https://substackcdn.com/image/fetch/$s_!0iE4!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F971676cb-beff-4206-a141-17ded15d575c_1678x937.png 1272w, https://substackcdn.com/image/fetch/$s_!0iE4!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F971676cb-beff-4206-a141-17ded15d575c_1678x937.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!0iE4!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F971676cb-beff-4206-a141-17ded15d575c_1678x937.png" width="1456" height="813" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/971676cb-beff-4206-a141-17ded15d575c_1678x937.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:813,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1983900,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F971676cb-beff-4206-a141-17ded15d575c_1678x937.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!0iE4!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F971676cb-beff-4206-a141-17ded15d575c_1678x937.png 424w, 
https://substackcdn.com/image/fetch/$s_!0iE4!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F971676cb-beff-4206-a141-17ded15d575c_1678x937.png 848w, https://substackcdn.com/image/fetch/$s_!0iE4!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F971676cb-beff-4206-a141-17ded15d575c_1678x937.png 1272w, https://substackcdn.com/image/fetch/$s_!0iE4!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F971676cb-beff-4206-a141-17ded15d575c_1678x937.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" 
y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee via ko-fi!&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee via ko-fi!</span></a></p><p>Whenever I give workshops or talks on AI search tools, someone eventually asks whether I have or recommend an evaluation framework or matrix for AI search tools.</p><p>I have been hesitant to give a firm answer. I know a thing or two about AI search, but I have much less experience, and frankly less interest, in building formal evaluation frameworks. Still, evaluation frameworks are a serious thread in information literacy, collection assessment, and procurement. The demand for them is real.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!MO1v!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F51d19aef-d01f-49c1-a5f1-27a656cd3284_546x583.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!MO1v!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F51d19aef-d01f-49c1-a5f1-27a656cd3284_546x583.png 424w, https://substackcdn.com/image/fetch/$s_!MO1v!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F51d19aef-d01f-49c1-a5f1-27a656cd3284_546x583.png 848w, 
https://substackcdn.com/image/fetch/$s_!MO1v!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F51d19aef-d01f-49c1-a5f1-27a656cd3284_546x583.png 1272w, https://substackcdn.com/image/fetch/$s_!MO1v!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F51d19aef-d01f-49c1-a5f1-27a656cd3284_546x583.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!MO1v!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F51d19aef-d01f-49c1-a5f1-27a656cd3284_546x583.png" width="546" height="583" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/51d19aef-d01f-49c1-a5f1-27a656cd3284_546x583.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:583,&quot;width&quot;:546,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:340857,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F51d19aef-d01f-49c1-a5f1-27a656cd3284_546x583.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!MO1v!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F51d19aef-d01f-49c1-a5f1-27a656cd3284_546x583.png 424w, https://substackcdn.com/image/fetch/$s_!MO1v!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F51d19aef-d01f-49c1-a5f1-27a656cd3284_546x583.png 
848w, https://substackcdn.com/image/fetch/$s_!MO1v!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F51d19aef-d01f-49c1-a5f1-27a656cd3284_546x583.png 1272w, https://substackcdn.com/image/fetch/$s_!MO1v!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F51d19aef-d01f-49c1-a5f1-27a656cd3284_546x583.png 1456w" sizes="100vw"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>My worry is that many evaluation matrices try to do too much at once. They aim to be universal. They give every criterion a score. 
They weight too many things equally. They also rely heavily on qualitative impressions, including for the thing that matters most when evaluating search tools: whether the tool can retrieve and rank useful material.</p><p>To put my argument more clearly: AI search evaluation frameworks should not produce a single universal score, at least not for everybody. They should specify the user role and task, identify non-negotiable gates, and test the most important claims empirically. For AI search tools, retrieval quality should be a core task-performance gate. If a tool cannot reliably retrieve and rank useful material for realistic queries, its interface, citation export, and administrative features are secondary.</p><p>That does not mean retrieval is the only non-negotiable gate. For institutional procurement, there may be other hard gates: privacy, accessibility, licence terms, data retention, security, local compliance requirements, and so on. A tool that fails those may be unacceptable regardless of how good its retrieval is. My point is narrower. Once we are evaluating something as a search tool, retrieval should not be treated as just one ordinary category among many.</p><p>In <a href="https://aarontay.substack.com/p/ai-academic-search-needs-better-frameworks">my last post</a>, I mentioned two librarian-led projects that implemented AI search evaluation frameworks, both coincidentally vibe-coded using Claude and both drawing at least partly on my work. <a href="https://omnomdombomb.github.io/ai_evaluation_framework_tool/AI-Tool-Assessment-Framework.html">One was by Wang Huajin and the team at Carnegie Mellon</a>, and <a href="https://aarontay.substack.com/p/ai-academic-search-needs-better-frameworks#:~:text=Mellon%2C%20and-,Alfred%20Wallace%20at%20the%20University%20of%20North%20Dakota,-each%20built%20something">the other by Alfred Wallace at the University of North Dakota</a>.</p><p>Both are good. More than good, actually. 
They show a relatively sophisticated understanding of how AI search tools differ. For example, they distinguish between tools that merely use an LLM to generate Boolean queries, tools that add reranking, tools that combine lexical and semantic retrieval, and tools that orchestrate multi-step agentic searches. That is already a step above treating &#8220;AI search&#8221; as a single homogeneous category.</p><p>Still, no framework is perfect. In this post, I want to suggest three improvements that could make AI search evaluation frameworks, including other existing ones like <a href="https://digitalcommons.lmu.edu/cgi/viewcontent.cgi?article=1171&amp;context=librarian_pubs">the REACT (Relevancy, Ease of Use, Assessing DEIA, Currency, Transparency &amp; Accuracy) framework</a><a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-1" href="#footnote-1" target="_self">1</a>, more useful for libraries:  </p><ol><li><p>Be explicit about whose needs the framework serves.</p></li><li><p>Treat retrieval capability as a gating criterion, not just one category among many.</p></li><li><p>Replace some qualitative judgements with lightweight empirical tests.</p></li></ol><p>None of these suggestions are novel in isolation. But I think putting them together would make these frameworks more practical and more honest.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/better-ai-search-rubrics-roles-gates?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://aarontay.substack.com/p/better-ai-search-rubrics-roles-gates?utm_source=substack&utm_medium=email&utm_content=share&action=share"><span>Share</span></a></p><p></p><h2>1. 
Evaluation matrices should be clear about who they are for</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!7tVl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11c4d48a-86b3-408f-9cb8-275d452bfb2b_1183x676.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!7tVl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11c4d48a-86b3-408f-9cb8-275d452bfb2b_1183x676.png 424w, https://substackcdn.com/image/fetch/$s_!7tVl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11c4d48a-86b3-408f-9cb8-275d452bfb2b_1183x676.png 848w, https://substackcdn.com/image/fetch/$s_!7tVl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11c4d48a-86b3-408f-9cb8-275d452bfb2b_1183x676.png 1272w, https://substackcdn.com/image/fetch/$s_!7tVl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11c4d48a-86b3-408f-9cb8-275d452bfb2b_1183x676.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!7tVl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11c4d48a-86b3-408f-9cb8-275d452bfb2b_1183x676.png" width="1183" height="676" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/11c4d48a-86b3-408f-9cb8-275d452bfb2b_1183x676.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:676,&quot;width&quot;:1183,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1034169,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11c4d48a-86b3-408f-9cb8-275d452bfb2b_1183x676.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!7tVl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11c4d48a-86b3-408f-9cb8-275d452bfb2b_1183x676.png 424w, https://substackcdn.com/image/fetch/$s_!7tVl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11c4d48a-86b3-408f-9cb8-275d452bfb2b_1183x676.png 848w, https://substackcdn.com/image/fetch/$s_!7tVl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11c4d48a-86b3-408f-9cb8-275d452bfb2b_1183x676.png 1272w, https://substackcdn.com/image/fetch/$s_!7tVl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11c4d48a-86b3-408f-9cb8-275d452bfb2b_1183x676.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>One of the hardest issues in designing an evaluation matrix is deciding whose needs matter most.</p><p>An undergraduate does not need the same things from an AI search tool as a faculty researcher. An instructor does not necessarily care about the same things as an evidence synthesis librarian. A graduate student doing exploratory research has different priorities from a librarian supporting a systematic review.</p><p>For example, reproducibility and interpretability are crucial for evidence synthesis. If you are supporting a systematic review, you need to know what was searched, how it was searched, and whether the same search can be repeated. 
But for an undergraduate writing an essay on a fairly well-trodden topic, reproducibility may matter much less.</p><p>Similarly, an undergraduate may value ease of use, clear explanations, and help finding a few credible sources. A researcher working in an emerging area, where terminology has not yet stabilised, may care much more about retrieval depth and the ability to surface relevant papers that keyword search would miss.</p><p>Many evaluation frameworks seem to assume that there can be one universal matrix for AI search tools that applies to every task or user. They assign points to many criteria and then produce an overall score. I think this is usually a mistake.</p><p>Without a clearly stated viewpoint, the best case is that the framework becomes too diffuse to be useful. The worst case is that the designer unintentionally over-encodes their own priorities into the scoring system.</p><p>For example, a librarian might give substantial weight to administrative features such as COUNTER statistics support, authentication options, and vendor support speed, because those are the areas they know and need the most. Those matter for procurement and management. But they do not matter much to the actual user trying to find relevant literature.</p><p>This is why I like <a href="https://aarontay.substack.com/p/ai-academic-search-needs-better-frameworks#:~:text=Mellon%2C%20and-,Alfred%20Wallace%20at%20the%20University%20of%20North%20Dakota,-each%20built%20something">Alfred Wallace&#8217;s </a><em><a href="https://aarontay.substack.com/p/ai-academic-search-needs-better-frameworks#:~:text=Mellon%2C%20and-,Alfred%20Wallace%20at%20the%20University%20of%20North%20Dakota,-each%20built%20something">Evaluating AI Tools for Research</a></em><a href="https://aarontay.substack.com/p/ai-academic-search-needs-better-frameworks#:~:text=Mellon%2C%20and-,Alfred%20Wallace%20at%20the%20University%20of%20North%20Dakota,-each%20built%20something"> matrix</a>. 
It allows the evaluator to choose a role, such as faculty researcher, graduate student, undergraduate, instructor, or student. The selected role then changes which criteria are treated as priorities or key questions.</p><p>I played around and vibe coded my own AI search evaluation framework based on <a href="https://omnomdombomb.github.io/ai_evaluation_framework_tool/AI-Tool-Assessment-Framework.html">AI-Powered Tool Assessment Framework</a> and <a href="https://alfredhw.github.io/airubric/">AI Rubric - Evaluating AI Tools for Research</a>. </p><p>It is <em><strong>not very good </strong></em>currently and needs much more work, but I can show you a screencap below of roughly what I mean.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!JTir!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23bcb6ff-a36f-4418-8f77-af26ed797ead_875x1074.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!JTir!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23bcb6ff-a36f-4418-8f77-af26ed797ead_875x1074.png 424w, https://substackcdn.com/image/fetch/$s_!JTir!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23bcb6ff-a36f-4418-8f77-af26ed797ead_875x1074.png 848w, https://substackcdn.com/image/fetch/$s_!JTir!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23bcb6ff-a36f-4418-8f77-af26ed797ead_875x1074.png 1272w, 
https://substackcdn.com/image/fetch/$s_!JTir!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23bcb6ff-a36f-4418-8f77-af26ed797ead_875x1074.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!JTir!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23bcb6ff-a36f-4418-8f77-af26ed797ead_875x1074.png" width="875" height="1074" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/23bcb6ff-a36f-4418-8f77-af26ed797ead_875x1074.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1074,&quot;width&quot;:875,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:87870,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23bcb6ff-a36f-4418-8f77-af26ed797ead_875x1074.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!JTir!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23bcb6ff-a36f-4418-8f77-af26ed797ead_875x1074.png 424w, https://substackcdn.com/image/fetch/$s_!JTir!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23bcb6ff-a36f-4418-8f77-af26ed797ead_875x1074.png 848w, 
https://substackcdn.com/image/fetch/$s_!JTir!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23bcb6ff-a36f-4418-8f77-af26ed797ead_875x1074.png 1272w, https://substackcdn.com/image/fetch/$s_!JTir!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23bcb6ff-a36f-4418-8f77-af26ed797ead_875x1074.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><em><strong>Figure: My draft role-based framework, vibe-coded based on AI-Powered Tool Assessment Framework and AI Rubric: Evaluating 
AI Tools for Research. This shows how different roles have different weightings for the same criteria. </strong></em></p><p>For simplicity, I only define three roles: undergraduate, researcher, and librarian. Each criterion falls into one of three levels depending on the role: critical, key, or important. The defaults can be changed.</p><p>In my current system, answers to most criteria fall into four bands, with values from 0 to 3. These are weighted more heavily if the criterion is key rather than important. Critical criteria are handled differently as &#8220;gates&#8221;, which I will discuss below.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!i5Gh!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffff6e334-9116-418a-90e7-163fcf325798_619x348.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!i5Gh!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffff6e334-9116-418a-90e7-163fcf325798_619x348.png 424w, https://substackcdn.com/image/fetch/$s_!i5Gh!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffff6e334-9116-418a-90e7-163fcf325798_619x348.png 848w, https://substackcdn.com/image/fetch/$s_!i5Gh!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffff6e334-9116-418a-90e7-163fcf325798_619x348.png 1272w, https://substackcdn.com/image/fetch/$s_!i5Gh!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffff6e334-9116-418a-90e7-163fcf325798_619x348.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!i5Gh!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffff6e334-9116-418a-90e7-163fcf325798_619x348.png" width="619" height="348" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/fff6e334-9116-418a-90e7-163fcf325798_619x348.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:348,&quot;width&quot;:619,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:28041,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffff6e334-9116-418a-90e7-163fcf325798_619x348.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!i5Gh!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffff6e334-9116-418a-90e7-163fcf325798_619x348.png 424w, https://substackcdn.com/image/fetch/$s_!i5Gh!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffff6e334-9116-418a-90e7-163fcf325798_619x348.png 848w, https://substackcdn.com/image/fetch/$s_!i5Gh!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffff6e334-9116-418a-90e7-163fcf325798_619x348.png 1272w, https://substackcdn.com/image/fetch/$s_!i5Gh!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffff6e334-9116-418a-90e7-163fcf325798_619x348.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><em><strong>Figure: This criterion is defined as a key question and weighted more heavily, so this tool scores 2 x 10 = 20 points on this criterion</strong></em></p><p>We can quibble about the exact roles and weights. The principle is what matters. 
A framework should make clear whose interests it is optimising for.</p><p>A simplified version of what each role might prioritize might look something like this:</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Fn4q!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F25e2eabb-4519-4ab9-8ff4-88f1a8884d10_969x335.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Fn4q!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F25e2eabb-4519-4ab9-8ff4-88f1a8884d10_969x335.png 424w, https://substackcdn.com/image/fetch/$s_!Fn4q!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F25e2eabb-4519-4ab9-8ff4-88f1a8884d10_969x335.png 848w, https://substackcdn.com/image/fetch/$s_!Fn4q!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F25e2eabb-4519-4ab9-8ff4-88f1a8884d10_969x335.png 1272w, https://substackcdn.com/image/fetch/$s_!Fn4q!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F25e2eabb-4519-4ab9-8ff4-88f1a8884d10_969x335.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Fn4q!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F25e2eabb-4519-4ab9-8ff4-88f1a8884d10_969x335.png" width="969" height="335" 
data-attrs="{&quot;src&quot;:&quot;https://substackcdn.com/image/fetch/$s_!Fn4q!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F25e2eabb-4519-4ab9-8ff4-88f1a8884d10_969x335.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:335,&quot;width&quot;:969,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:17763,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F25e2eabb-4519-4ab9-8ff4-88f1a8884d10_969x335.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!Fn4q!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F25e2eabb-4519-4ab9-8ff4-88f1a8884d10_969x335.png 424w, https://substackcdn.com/image/fetch/$s_!Fn4q!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F25e2eabb-4519-4ab9-8ff4-88f1a8884d10_969x335.png 848w, https://substackcdn.com/image/fetch/$s_!Fn4q!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F25e2eabb-4519-4ab9-8ff4-88f1a8884d10_969x335.png 1272w, https://substackcdn.com/image/fetch/$s_!Fn4q!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F25e2eabb-4519-4ab9-8ff4-88f1a8884d10_969x335.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button 
tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This matters because it helps libraries justify decisions more clearly by stating which group of users each tool is for. Instead of saying, &#8220;For all users, Tool A scored 82 and Tool B scored 76,&#8221; we can say something more meaningful: &#8220;Tool A is better for undergraduate discovery (scoring 82), while Tool B is more suitable for advanced research or evidence synthesis (scoring 92), taking into account what each role cares about.&#8221;</p><h2>2. Think Non-negotiable Gates, not just composite scores</h2><p>Many evaluation frameworks are extremely comprehensive. 
They try to account for everything: retrieval, usability, accessibility, privacy, sustainability, source coverage, citation handling, export options, transparency, administration features, and more.</p><p>They assign weights to each criterion (typically evenly without much thought), expect evaluators to score each area and then sum up the scores to get a final score.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!4aUz!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff1729b35-9451-47ff-b6d3-17acc9352d2d_1184x679.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!4aUz!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff1729b35-9451-47ff-b6d3-17acc9352d2d_1184x679.png 424w, https://substackcdn.com/image/fetch/$s_!4aUz!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff1729b35-9451-47ff-b6d3-17acc9352d2d_1184x679.png 848w, https://substackcdn.com/image/fetch/$s_!4aUz!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff1729b35-9451-47ff-b6d3-17acc9352d2d_1184x679.png 1272w, https://substackcdn.com/image/fetch/$s_!4aUz!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff1729b35-9451-47ff-b6d3-17acc9352d2d_1184x679.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!4aUz!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff1729b35-9451-47ff-b6d3-17acc9352d2d_1184x679.png" width="1184" height="679" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f1729b35-9451-47ff-b6d3-17acc9352d2d_1184x679.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:679,&quot;width&quot;:1184,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1081315,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff1729b35-9451-47ff-b6d3-17acc9352d2d_1184x679.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!4aUz!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff1729b35-9451-47ff-b6d3-17acc9352d2d_1184x679.png 424w, https://substackcdn.com/image/fetch/$s_!4aUz!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff1729b35-9451-47ff-b6d3-17acc9352d2d_1184x679.png 848w, https://substackcdn.com/image/fetch/$s_!4aUz!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff1729b35-9451-47ff-b6d3-17acc9352d2d_1184x679.png 1272w, https://substackcdn.com/image/fetch/$s_!4aUz!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff1729b35-9451-47ff-b6d3-17acc9352d2d_1184x679.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>But this can result in you missing the big picture. If your mandatory requirement is accessibility for legal reasons, or if you are an evidence synthesis researcher and cannot use tools whose results are not reproducible, you should use these criteria as &#8220;gates&#8221; to test first. </p><p>By a &#8220;gate&#8221;, I mean a criterion that a tool must pass before we continue evaluating it. If the tool fails that criterion, we stop. It does not matter how well it performs on secondary features.</p><blockquote><p>Your &#8220;gates&#8221;, in the context of AI search, could be environmental issues, copyright issues or impact on learning and of course performance issues. 
So for example, if your non-negotiable is that the AI search tool should not impact learning by generating direct answers, you might opt for the &#8220;gate&#8221; of tools that only give a listing of results, not answers, aka Deep Search or Quick search tools.</p><p>See <strong><a href="https://aarontay.substack.com/p/what-do-we-actually-mean-by-ai-powered">What Do We Actually Mean by &#8220;AI-Powered Search&#8221;?</a></strong><a href="https://aarontay.substack.com/p/what-do-we-actually-mean-by-ai-powered"> </a></p></blockquote><p>One way to fix this is simply to set an extremely high weight for this mandatory criterion. But I think a cleaner approach is to set a minimum threshold that the gated criterion must reach, or else it fails no matter what the overall score is.</p><h2>Retrieval should be a core gate, not just another category</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!-KyP!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9f67bdd2-2a1e-41f0-85aa-3b715d819878_1180x670.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!-KyP!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9f67bdd2-2a1e-41f0-85aa-3b715d819878_1180x670.png 424w, https://substackcdn.com/image/fetch/$s_!-KyP!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9f67bdd2-2a1e-41f0-85aa-3b715d819878_1180x670.png 848w, https://substackcdn.com/image/fetch/$s_!-KyP!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9f67bdd2-2a1e-41f0-85aa-3b715d819878_1180x670.png 1272w, 
https://substackcdn.com/image/fetch/$s_!-KyP!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9f67bdd2-2a1e-41f0-85aa-3b715d819878_1180x670.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!-KyP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9f67bdd2-2a1e-41f0-85aa-3b715d819878_1180x670.png" width="1180" height="670" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/9f67bdd2-2a1e-41f0-85aa-3b715d819878_1180x670.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:670,&quot;width&quot;:1180,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1214029,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9f67bdd2-2a1e-41f0-85aa-3b715d819878_1180x670.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!-KyP!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9f67bdd2-2a1e-41f0-85aa-3b715d819878_1180x670.png 424w, https://substackcdn.com/image/fetch/$s_!-KyP!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9f67bdd2-2a1e-41f0-85aa-3b715d819878_1180x670.png 848w, 
https://substackcdn.com/image/fetch/$s_!-KyP!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9f67bdd2-2a1e-41f0-85aa-3b715d819878_1180x670.png 1272w, https://substackcdn.com/image/fetch/$s_!-KyP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9f67bdd2-2a1e-41f0-85aa-3b715d819878_1180x670.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Besides abiding by legal requirements, for AI search tools, in my view, retrieval capability should be one of those gates and this is 
often overlooked. </p><p>A search tool with weak retrieval should not be rescued by good citation formatting, a nice interface, or convenient administrative features. Those things are useful, but only after the tool has passed the basic test of finding and ranking relevant material.</p><p>In many evaluation matrices, retrieval strength, even when combined with source coverage, ends up accounting for perhaps 20 to 25 per cent of the overall score. This often happens because frameworks have four or five broad categories and weight them equally.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!j3CQ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfcf1893-c941-4e89-bc5c-85af01355440_1182x689.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!j3CQ!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfcf1893-c941-4e89-bc5c-85af01355440_1182x689.png 424w, https://substackcdn.com/image/fetch/$s_!j3CQ!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfcf1893-c941-4e89-bc5c-85af01355440_1182x689.png 848w, https://substackcdn.com/image/fetch/$s_!j3CQ!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfcf1893-c941-4e89-bc5c-85af01355440_1182x689.png 1272w, https://substackcdn.com/image/fetch/$s_!j3CQ!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfcf1893-c941-4e89-bc5c-85af01355440_1182x689.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!j3CQ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfcf1893-c941-4e89-bc5c-85af01355440_1182x689.png" width="1182" height="689" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/cfcf1893-c941-4e89-bc5c-85af01355440_1182x689.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:689,&quot;width&quot;:1182,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:975139,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfcf1893-c941-4e89-bc5c-85af01355440_1182x689.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!j3CQ!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfcf1893-c941-4e89-bc5c-85af01355440_1182x689.png 424w, https://substackcdn.com/image/fetch/$s_!j3CQ!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfcf1893-c941-4e89-bc5c-85af01355440_1182x689.png 848w, https://substackcdn.com/image/fetch/$s_!j3CQ!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfcf1893-c941-4e89-bc5c-85af01355440_1182x689.png 1272w, https://substackcdn.com/image/fetch/$s_!j3CQ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfcf1893-c941-4e89-bc5c-85af01355440_1182x689.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>That badly underweights retrieval. Finding relevant material is the central purpose of a search tool. If the retrieval is poor, the rest is secondary.</p><p>Again, I am not arguing that retrieval overrides every other concern. I am arguing that retrieval should be treated as at least ONE core task-performance gate for search tools.</p><p>For example:</p><blockquote><p>If a tool is rated &#8220;poor&#8221; on retrieval capability, it fails the evaluation, regardless of its performance on other criteria. 
</p></blockquote><p>This approach forces evaluators to decide what is non-negotiable. It also prevents a tool from getting an acceptable overall score by compensating for bad retrieval with peripheral strengths.</p><p>The screenshot below shows my example, where retrieval capability, measured through a simple precision test, is set as a critical criterion. The tool needs to be rated 2 or above, corresponding to 50 to 80 per cent precision. In this example, it is rated only 1, corresponding to 31 to 50 per cent precision, so it fails the gating criterion.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!VIBe!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14202263-38f2-4e4f-ba9a-a0173d36b71c_860x519.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!VIBe!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14202263-38f2-4e4f-ba9a-a0173d36b71c_860x519.png 424w, https://substackcdn.com/image/fetch/$s_!VIBe!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14202263-38f2-4e4f-ba9a-a0173d36b71c_860x519.png 848w, https://substackcdn.com/image/fetch/$s_!VIBe!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14202263-38f2-4e4f-ba9a-a0173d36b71c_860x519.png 1272w, https://substackcdn.com/image/fetch/$s_!VIBe!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14202263-38f2-4e4f-ba9a-a0173d36b71c_860x519.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!VIBe!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14202263-38f2-4e4f-ba9a-a0173d36b71c_860x519.png" width="860" height="519" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/14202263-38f2-4e4f-ba9a-a0173d36b71c_860x519.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:519,&quot;width&quot;:860,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:53928,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14202263-38f2-4e4f-ba9a-a0173d36b71c_860x519.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!VIBe!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14202263-38f2-4e4f-ba9a-a0173d36b71c_860x519.png 424w, https://substackcdn.com/image/fetch/$s_!VIBe!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14202263-38f2-4e4f-ba9a-a0173d36b71c_860x519.png 848w, https://substackcdn.com/image/fetch/$s_!VIBe!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14202263-38f2-4e4f-ba9a-a0173d36b71c_860x519.png 1272w, https://substackcdn.com/image/fetch/$s_!VIBe!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14202263-38f2-4e4f-ba9a-a0173d36b71c_860x519.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><em><strong>Figure: Example of a gate-based evaluation model. Retrieval capability is set as a critical criterion and requires a score of 2 or higher. 
The tool automatically fails here because it is rated only 1.</strong></em></p><p>Tools that fail the minimum retrieval threshold are rejected before secondary criteria such as usability, citation handling, export, or administration features are considered.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!giWT!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e1eca59-323d-4c12-af80-f47cf7bdb35d_862x710.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!giWT!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e1eca59-323d-4c12-af80-f47cf7bdb35d_862x710.png 424w, https://substackcdn.com/image/fetch/$s_!giWT!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e1eca59-323d-4c12-af80-f47cf7bdb35d_862x710.png 848w, https://substackcdn.com/image/fetch/$s_!giWT!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e1eca59-323d-4c12-af80-f47cf7bdb35d_862x710.png 1272w, https://substackcdn.com/image/fetch/$s_!giWT!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e1eca59-323d-4c12-af80-f47cf7bdb35d_862x710.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!giWT!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e1eca59-323d-4c12-af80-f47cf7bdb35d_862x710.png" width="862" height="710" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/5e1eca59-323d-4c12-af80-f47cf7bdb35d_862x710.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:710,&quot;width&quot;:862,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:45491,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e1eca59-323d-4c12-af80-f47cf7bdb35d_862x710.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!giWT!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e1eca59-323d-4c12-af80-f47cf7bdb35d_862x710.png 424w, https://substackcdn.com/image/fetch/$s_!giWT!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e1eca59-323d-4c12-af80-f47cf7bdb35d_862x710.png 848w, https://substackcdn.com/image/fetch/$s_!giWT!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e1eca59-323d-4c12-af80-f47cf7bdb35d_862x710.png 1272w, https://substackcdn.com/image/fetch/$s_!giWT!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e1eca59-323d-4c12-af80-f47cf7bdb35d_862x710.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><em><strong>Figure: The summary screen highlights that, regardless of the overall score, the tool failed the critical criterion.</strong></em></p><p>Paying attention to retrieval is particularly important now because &#8220;AI search&#8221; is not a mature or stable category. Many vendors are under pressure to show that they are &#8220;doing AI&#8221;. Some products are genuinely rethinking retrieval. <a href="https://aarontay.substack.com/p/the-horseless-carriage-of-ai-search">Others are merely bolting an LLM onto a conventional search system, using it to generate Boolean queries and then calling the result AI search.</a></p><p>That may or may not improve performance. Sometimes it may add little. 
Sometimes it may make things worse.</p><p>I have personally tested an &#8220;AI search&#8221; tool that was worse than standard lexical keyword search. It was not subtly worse. It was obviously broken. Librarians and researchers testing it could tell almost immediately that the retrieval quality was poor.</p><p>If I had treated retrieval as a gate, I could have saved everyone time before asking them to test it.</p><p>This is why a gate-based model matters. It prevents the evaluation from being diluted by a long list of attractive but secondary features and can save time.</p><h2>3. Some criteria should be made harder and more testable</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!6WuK!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa48b819a-aad0-4dc0-9317-26e551de80c7_1180x667.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!6WuK!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa48b819a-aad0-4dc0-9317-26e551de80c7_1180x667.png 424w, https://substackcdn.com/image/fetch/$s_!6WuK!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa48b819a-aad0-4dc0-9317-26e551de80c7_1180x667.png 848w, https://substackcdn.com/image/fetch/$s_!6WuK!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa48b819a-aad0-4dc0-9317-26e551de80c7_1180x667.png 1272w, https://substackcdn.com/image/fetch/$s_!6WuK!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa48b819a-aad0-4dc0-9317-26e551de80c7_1180x667.png 1456w" 
sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!6WuK!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa48b819a-aad0-4dc0-9317-26e551de80c7_1180x667.png" width="1180" height="667" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/a48b819a-aad0-4dc0-9317-26e551de80c7_1180x667.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:667,&quot;width&quot;:1180,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1129884,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa48b819a-aad0-4dc0-9317-26e551de80c7_1180x667.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!6WuK!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa48b819a-aad0-4dc0-9317-26e551de80c7_1180x667.png 424w, https://substackcdn.com/image/fetch/$s_!6WuK!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa48b819a-aad0-4dc0-9317-26e551de80c7_1180x667.png 848w, https://substackcdn.com/image/fetch/$s_!6WuK!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa48b819a-aad0-4dc0-9317-26e551de80c7_1180x667.png 1272w, 
https://substackcdn.com/image/fetch/$s_!6WuK!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa48b819a-aad0-4dc0-9317-26e551de80c7_1180x667.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Another thing I notice about many librarian evaluation matrices is that they rely heavily on qualitative judgement.</p><p>Sometimes this is unavoidable. Some criteria really are soft. 
Usability, for example, is difficult to reduce to a single objective number unless you run proper usability testing, which takes time and expertise.</p><p>But some criteria can be made more empirical, especially the critical ones.</p><p>Take reproducibility. <a href="https://katinamagazine.org/content/article/reviews/2025/deep-dive-into-three-ai-academic-search-tools">A simple test is to run the same query several times and record whether the same results appear in the same order</a>. You might run the query five or ten times, possibly across different sessions or accounts to reduce caching effects, and see how stable the ranking is.</p><p>Take interpretability. If an AI search system converts a natural language query into a Boolean string, you can copy the generated Boolean query into the conventional search interface and check whether the results match. If they do not, then either the system is not doing what it claims, or the Boolean explanation does not fully represent the actual search process.</p><p>Take claim-source faithfulness. If a tool generates an answer and cites sources, evaluators can check how often the cited sources actually support the claims made. </p><blockquote><p>Michael Gusenbauer&#8217;s work has influenced many of my thoughts here. <a href="https://onlinelibrary.wiley.com/doi/10.1002/jrsm.1378">His papers offer comparatively objective ways to assess academic search systems for evidence synthesis</a>, including tests of search functionality, retrieval qualities, database size, and subject coverage. 
SearchSmart builds on this work <a href="https://link.springer.com/article/10.1007/s11192-022-04289-7">by estimating coverage of academic databases using methods such as query hit counts, and the Basket of Keywords approach</a>, rather than relying only on vendor descriptions or self-reported coverage.</p></blockquote><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!wAG3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Faed1b816-e017-4a92-9b99-212d55693e23_1174x660.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!wAG3!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Faed1b816-e017-4a92-9b99-212d55693e23_1174x660.png 424w, https://substackcdn.com/image/fetch/$s_!wAG3!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Faed1b816-e017-4a92-9b99-212d55693e23_1174x660.png 848w, https://substackcdn.com/image/fetch/$s_!wAG3!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Faed1b816-e017-4a92-9b99-212d55693e23_1174x660.png 1272w, https://substackcdn.com/image/fetch/$s_!wAG3!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Faed1b816-e017-4a92-9b99-212d55693e23_1174x660.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!wAG3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Faed1b816-e017-4a92-9b99-212d55693e23_1174x660.png" width="1174" height="660" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/aed1b816-e017-4a92-9b99-212d55693e23_1174x660.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:660,&quot;width&quot;:1174,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1077835,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Faed1b816-e017-4a92-9b99-212d55693e23_1174x660.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!wAG3!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Faed1b816-e017-4a92-9b99-212d55693e23_1174x660.png 424w, https://substackcdn.com/image/fetch/$s_!wAG3!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Faed1b816-e017-4a92-9b99-212d55693e23_1174x660.png 848w, https://substackcdn.com/image/fetch/$s_!wAG3!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Faed1b816-e017-4a92-9b99-212d55693e23_1174x660.png 1272w, https://substackcdn.com/image/fetch/$s_!wAG3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Faed1b816-e017-4a92-9b99-212d55693e23_1174x660.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>But the area where I think empirical testing matters most is retrieval capability. If retrieval is a core task-performance gate, then it should not be assessed only by impression.</p><p>This is where things get more complicated.</p><p><a href="https://alfredhw.github.io/airubric/">Alfred Wallace&#8217;s framework</a> asks evaluators to assess the &#8220;AI search architecture spectrum&#8221;, distinguishing between LLM-generated Boolean, Boolean plus reranking, hybrid search, and agentic or deep search.  
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!P7u1!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9766d8d1-4cb0-4209-9509-388757111908_976x699.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!P7u1!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9766d8d1-4cb0-4209-9509-388757111908_976x699.png 424w, https://substackcdn.com/image/fetch/$s_!P7u1!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9766d8d1-4cb0-4209-9509-388757111908_976x699.png 848w, https://substackcdn.com/image/fetch/$s_!P7u1!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9766d8d1-4cb0-4209-9509-388757111908_976x699.png 1272w, https://substackcdn.com/image/fetch/$s_!P7u1!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9766d8d1-4cb0-4209-9509-388757111908_976x699.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!P7u1!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9766d8d1-4cb0-4209-9509-388757111908_976x699.png" width="976" height="699" 
data-attrs="{&quot;src&quot;:&quot;https://substackcdn.com/image/fetch/$s_!P7u1!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9766d8d1-4cb0-4209-9509-388757111908_976x699.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:699,&quot;width&quot;:976,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:45991,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9766d8d1-4cb0-4209-9509-388757111908_976x699.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!P7u1!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9766d8d1-4cb0-4209-9509-388757111908_976x699.png 424w, https://substackcdn.com/image/fetch/$s_!P7u1!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9766d8d1-4cb0-4209-9509-388757111908_976x699.png 848w, https://substackcdn.com/image/fetch/$s_!P7u1!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9766d8d1-4cb0-4209-9509-388757111908_976x699.png 1272w, https://substackcdn.com/image/fetch/$s_!P7u1!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9766d8d1-4cb0-4209-9509-388757111908_976x699.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button 
tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><em><strong>Figure: Alfred Wallace&#8217;s framework asks evaluators to assess the AI search architecture spectrum.</strong></em></p><p>That is a useful first approximation. In general, I would expect a well-implemented agentic or deep search tool to outperform a tool that simply asks an LLM to generate a Boolean query and then runs it through a conventional retrieval system.</p><p>But retrieval is messy. Implementation matters. A poorly implemented &#8220;deep search&#8221; tool may perform worse than a simpler hybrid system. 
Marketing labels are not enough.</p><p>So we need empirical tests, even if they are rough.</p><h2>How might librarians test retrieval strength?</h2><p>Last May, I wrote two posts on <a href="https://aarontay.substack.com/p/testing-ai-academic-search-engines-1">testing AI academic search engines (I)</a> and <a href="https://aarontay.substack.com/p/testing-ai-academic-search-engines-what">(II)</a>. I also drafted a third post focused specifically on retrieval testing, but it became too long and technical. It went from <a href="https://trec.nist.gov/">TREC-style ad hoc retrieval evaluation</a> to <a href="https://trec-rag.github.io/trec24/">modern RAG evaluation</a>, and I eventually decided it was probably too much for the audience I had in mind.</p><p>The challenge is balance. We should not expect most librarians to run formal information retrieval evaluations. We are not trying to reproduce <a href="https://trec.nist.gov/">TREC methodology</a>, nor are we trying to run a <a href="https://pmc.ncbi.nlm.nih.gov/articles/PMC10107874/">Study Within A Review</a> such as <a href="https://www.medrxiv.org/content/10.64898/2026.04.13.26350802v1.full-text">the Cochrane Evaluation of (Semi-) Automated Review methods (CESAR)</a>.</p><p><em>But we can do better than impressions.</em></p><p>Below are two lightweight, though far from perfect, retrieval tests that librarians can try when evaluating search tools<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-2" href="#footnote-2" target="_self">2</a>.</p><p>This will not produce bullet-proof, publishable IR research. 
But it is often better than simply giving your feelings on whether the results &#8220;look good&#8221; in general.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!8AWr!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2640528c-4ac3-481b-a935-d413ee136655_1200x680.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!8AWr!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2640528c-4ac3-481b-a935-d413ee136655_1200x680.png 424w, https://substackcdn.com/image/fetch/$s_!8AWr!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2640528c-4ac3-481b-a935-d413ee136655_1200x680.png 848w, https://substackcdn.com/image/fetch/$s_!8AWr!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2640528c-4ac3-481b-a935-d413ee136655_1200x680.png 1272w, https://substackcdn.com/image/fetch/$s_!8AWr!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2640528c-4ac3-481b-a935-d413ee136655_1200x680.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!8AWr!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2640528c-4ac3-481b-a935-d413ee136655_1200x680.png" width="1200" height="680" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/2640528c-4ac3-481b-a935-d413ee136655_1200x680.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:680,&quot;width&quot;:1200,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:985296,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2640528c-4ac3-481b-a935-d413ee136655_1200x680.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!8AWr!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2640528c-4ac3-481b-a935-d413ee136655_1200x680.png 424w, https://substackcdn.com/image/fetch/$s_!8AWr!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2640528c-4ac3-481b-a935-d413ee136655_1200x680.png 848w, https://substackcdn.com/image/fetch/$s_!8AWr!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2640528c-4ac3-481b-a935-d413ee136655_1200x680.png 1272w, https://substackcdn.com/image/fetch/$s_!8AWr!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2640528c-4ac3-481b-a935-d413ee136655_1200x680.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2>Retrieval test 1: recall@K using a known set</h2><p>One relatively simple test is to use a topic where you already know many relevant papers and feel you likely have most if not all relevant papers.</p><p>For example, suppose you have worked extensively on a topic and already have a set of papers you consider relevant. You can treat that set as a rough gold standard. Then you run the same query in each AI search tool and check how many of those known relevant papers appear in the top K results.</p><p>This gives you recall@K.</p><p>For example, if your gold standard set has 20 relevant papers, and a tool retrieves 8 of them in the top 30 results, then its recall@30 is 8/20, or 40%.</p><p>The question, of course, is what value of K to use. There is no universal answer. Common values might be 10, 20, or 50. 
Personally, I would often use 20 or 50 because that roughly matches the number of results I am likely to scan seriously.</p><p>One obvious source of gold standard sets is systematic reviews, meta-analyses, review articles, and survey papers. You can use their included studies or references as a benchmark.</p><p>There is a catch. If the review article has already been published, some AI search tools may find the review itself and mine its references. That makes the test less clean. Still, for practical library evaluation, it may be good enough, especially if the aim is not formal research but comparative assessment.</p><p>For more sophisticated testing, you could also use <a href="https://www.evidentlyai.com/ranking-metrics/ndcg-metric">NDCG@K, or Normalised Discounted Cumulative Gain</a>. This is rank-sensitive, meaning it gives more credit when highly relevant results appear near the top.</p><h2>Retrieval test 2: precision@K when no gold standard exists</h2><p>Not everyone has a gold standard set of papers lying around. In that case, a more realistic test is precision@K.</p><p>The process is simple:</p><ol><li><p>Choose a realistic query.</p></li><li><p>Run it in each tool.</p></li><li><p>Look at the top K results, such as the top 10.</p></li><li><p>Judge how many are relevant.</p></li><li><p>Calculate the proportion of relevant results.</p></li></ol><p>If 7 of the top 10 results are relevant, precision@10 is 70%.</p><p>This is easy to understand and relatively easy to run. It does not tell you whether the tool found all the relevant literature, but it does tell you whether the top results are useful.</p><p>For many users, especially undergraduates and those just doing quick exploratory searches, this may be a reasonable test. They are often not trying to find everything. They are trying to find enough good material quickly.</p><p>However, precision@K has a limitation: it is not order-sensitive. 
A tool that places the best result at rank 1 and another that places it at rank 10 may receive the same precision@10 score. If ranking quality matters, you could also consider <a href="https://www.evidentlyai.com/ranking-metrics/mean-average-precision-map">Average Precision (AP@K)  </a></p><p>Again, though, I would not overcomplicate this at the start. A rough precision@10 test across several realistic queries is already useful. In fact, I suspect most librarians or researchers already sort of do that, just that they don&#8217;t formally keep track of it.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!CHrJ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0371aac0-1b25-4883-9b1a-02d804c8bd5d_600x599.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!CHrJ!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0371aac0-1b25-4883-9b1a-02d804c8bd5d_600x599.png 424w, https://substackcdn.com/image/fetch/$s_!CHrJ!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0371aac0-1b25-4883-9b1a-02d804c8bd5d_600x599.png 848w, https://substackcdn.com/image/fetch/$s_!CHrJ!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0371aac0-1b25-4883-9b1a-02d804c8bd5d_600x599.png 1272w, https://substackcdn.com/image/fetch/$s_!CHrJ!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0371aac0-1b25-4883-9b1a-02d804c8bd5d_600x599.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!CHrJ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0371aac0-1b25-4883-9b1a-02d804c8bd5d_600x599.png" width="600" height="599" data-attrs="{&quot;src&quot;:&quot;https://substackcdn.com/image/fetch/$s_!CHrJ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0371aac0-1b25-4883-9b1a-02d804c8bd5d_600x599.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:599,&quot;width&quot;:600,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:88115,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0371aac0-1b25-4883-9b1a-02d804c8bd5d_600x599.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!CHrJ!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0371aac0-1b25-4883-9b1a-02d804c8bd5d_600x599.png 424w, https://substackcdn.com/image/fetch/$s_!CHrJ!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0371aac0-1b25-4883-9b1a-02d804c8bd5d_600x599.png 848w, https://substackcdn.com/image/fetch/$s_!CHrJ!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0371aac0-1b25-4883-9b1a-02d804c8bd5d_600x599.png 1272w, 
https://substackcdn.com/image/fetch/$s_!CHrJ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0371aac0-1b25-4883-9b1a-02d804c8bd5d_600x599.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><em><strong>Figure - Three lightweight ways to test retrieval strength.</strong><br> </em></p><h2>Why formal information retrieval is not easy</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" 
href="https://substackcdn.com/image/fetch/$s_!PdMN!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F37dcd5bd-9de1-4344-bf1e-38c53dab61a3_1024x559.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!PdMN!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F37dcd5bd-9de1-4344-bf1e-38c53dab61a3_1024x559.png 424w, https://substackcdn.com/image/fetch/$s_!PdMN!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F37dcd5bd-9de1-4344-bf1e-38c53dab61a3_1024x559.png 848w, https://substackcdn.com/image/fetch/$s_!PdMN!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F37dcd5bd-9de1-4344-bf1e-38c53dab61a3_1024x559.png 1272w, https://substackcdn.com/image/fetch/$s_!PdMN!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F37dcd5bd-9de1-4344-bf1e-38c53dab61a3_1024x559.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!PdMN!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F37dcd5bd-9de1-4344-bf1e-38c53dab61a3_1024x559.png" width="1024" height="559" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/37dcd5bd-9de1-4344-bf1e-38c53dab61a3_1024x559.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:594798,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F37dcd5bd-9de1-4344-bf1e-38c53dab61a3_1024x559.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!PdMN!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F37dcd5bd-9de1-4344-bf1e-38c53dab61a3_1024x559.png 424w, https://substackcdn.com/image/fetch/$s_!PdMN!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F37dcd5bd-9de1-4344-bf1e-38c53dab61a3_1024x559.png 848w, https://substackcdn.com/image/fetch/$s_!PdMN!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F37dcd5bd-9de1-4344-bf1e-38c53dab61a3_1024x559.png 1272w, https://substackcdn.com/image/fetch/$s_!PdMN!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F37dcd5bd-9de1-4344-bf1e-38c53dab61a3_1024x559.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>Studying and evaluating information retrieval results requires a ton of expertise.</p><p>I don&#8217;t want to make the discussion too technical, but here are several issues that complicate the story.</p><ul><li><p>We need to distinguish corpus coverage from retrieval and ranking. A tool may fail to retrieve a paper because it is not in the corpus, because the query did not match it, or because the ranking pushed it too far down. When Undermind does not find a known gold-standard relevant result at, say, recall@50, you should do a known-item search in the source it uses to check whether the failure is due to the corpus or the search.</p></li><li><p>We need to be careful when using known sets from systematic reviews, meta-analyses, review articles, or survey papers. 
These can be useful, but they are not perfect gold standards.</p></li><li><p>Precision testing sounds simple, but formally, you have to ensure there are clear inclusion and exclusion criteria before judging the results, and ideally you need multiple assessors, to avoid it becoming just another form of subjective impression<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-3" href="#footnote-3" target="_self">3</a>.</p></li><li><p>We need to choose metrics that are understandable and appropriate. Precision@K, recall@K, known-item success, NDCG@K, and MAP@K answer slightly different questions.</p></li><li><p>We will have difficulty deciding what is a &#8220;normal&#8221; baseline recall/precision@K etc. for an academic search. What could be the baseline? Google Scholar? Your library catalog/discovery service?</p></li></ul><p>These are important, and I will discuss these issues and more in future posts. For this post, the simpler point is enough: if retrieval is central to the purpose of the tool, then retrieval should be tested, not merely described.</p><h2>Choosing good test queries</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!BuKK!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F974a3124-9918-4cac-8964-359da28142cf_1194x663.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!BuKK!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F974a3124-9918-4cac-8964-359da28142cf_1194x663.png 424w, 
https://substackcdn.com/image/fetch/$s_!BuKK!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F974a3124-9918-4cac-8964-359da28142cf_1194x663.png 848w, https://substackcdn.com/image/fetch/$s_!BuKK!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F974a3124-9918-4cac-8964-359da28142cf_1194x663.png 1272w, https://substackcdn.com/image/fetch/$s_!BuKK!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F974a3124-9918-4cac-8964-359da28142cf_1194x663.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!BuKK!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F974a3124-9918-4cac-8964-359da28142cf_1194x663.png" width="1194" height="663" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/974a3124-9918-4cac-8964-359da28142cf_1194x663.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:663,&quot;width&quot;:1194,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1292802,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F974a3124-9918-4cac-8964-359da28142cf_1194x663.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!BuKK!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F974a3124-9918-4cac-8964-359da28142cf_1194x663.png 424w, https://substackcdn.com/image/fetch/$s_!BuKK!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F974a3124-9918-4cac-8964-359da28142cf_1194x663.png 848w, https://substackcdn.com/image/fetch/$s_!BuKK!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F974a3124-9918-4cac-8964-359da28142cf_1194x663.png 1272w, https://substackcdn.com/image/fetch/$s_!BuKK!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F974a3124-9918-4cac-8964-359da28142cf_1194x663.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" 
stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>Still, I want to briefly discuss a critical issue when testing search engines. Choosing which queries to test is obviously tricky.</p><p>But a very common mistake I see is testing only &#8220;easy&#8221; queries. An &#8220;easy&#8221; query is not always the same as a broad query, but the two often overlap. If your topic has many obviously and easily found (because terminology is known and stable) relevant papers, most decent systems will return something plausible. That makes it hard to distinguish strong retrieval systems from merely adequate ones and with &#8220;AI search&#8221; we want to do that.</p><blockquote><p>I occasionally see librarians say the new class of AI search engine isn&#8217;t much better than conventional search mostly because they make this mistake or alternatively they can&#8217;t tell the difference between AI search engines of obviously different quality as the test results look close.</p></blockquote><p>You can often tell this is happening when <em>multiple retrieval systems achieve high apparent precision but return very different sets of results with low overlap</em>. Low overlap between systems may suggest that there are many relevant papers in the index, so the test is not very discriminating.</p><p>A better test set should include some harder queries. 
For example:</p><ul><li><p>topics where terminology varies across disciplines;</p></li><li><p>emerging topics where vocabulary has not stabilised;</p></li><li><p>interdisciplinary questions;</p></li><li><p>questions involving very specific conditions for relevance;</p></li><li><p>known-item searches for papers that should be found but are not obvious from simple keywords.</p></li></ul><p>Overall, if you know your query has very few relevant articles and those articles cannot be found easily with trivial keywords, the query is likely to be hard.</p><p>How many queries should you test? The glib answer is: as many as you can. You could even crowdsource them. But some testing is better than none.</p><p>I find even five well-chosen queries can reveal a lot, allowing you to distinguish the average from the best, especially if they include difficult cases.</p><h2>The unanswered question about cost</h2><p>Even if a tool passes the retrieval gate and satisfies role-specific criteria, there is one final pragmatic hurdle: the cost-to-performance ratio.</p><p>In the information retrieval research community, people often chase marginal gains in metrics such as Mean Average Precision (Average Precision across multiple queries) without caring about the cost (in terms of compute or latency). In an institutional library context, the question is different. A 5 per cent improvement in retrieval performance may or may not justify a much higher subscription cost, additional staff training or even privacy risk.</p><p>So the question is not simply whether Tool B retrieves slightly better results than Tool A. The question is whether that improvement is worth the cost and trade-offs for the institution and for the users the library is trying to serve.</p><p>That is not an easy question. 
But at least a role-based, gate-based, test-informed framework gives us a better way to ask it.</p><h2>What this means for AI search evaluation frameworks</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!4E9L!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1732fd2b-7bb8-473c-b73b-3e96299f7e07_1180x685.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!4E9L!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1732fd2b-7bb8-473c-b73b-3e96299f7e07_1180x685.png 424w, https://substackcdn.com/image/fetch/$s_!4E9L!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1732fd2b-7bb8-473c-b73b-3e96299f7e07_1180x685.png 848w, https://substackcdn.com/image/fetch/$s_!4E9L!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1732fd2b-7bb8-473c-b73b-3e96299f7e07_1180x685.png 1272w, https://substackcdn.com/image/fetch/$s_!4E9L!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1732fd2b-7bb8-473c-b73b-3e96299f7e07_1180x685.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!4E9L!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1732fd2b-7bb8-473c-b73b-3e96299f7e07_1180x685.png" width="1180" height="685" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/1732fd2b-7bb8-473c-b73b-3e96299f7e07_1180x685.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:685,&quot;width&quot;:1180,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:944030,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/195558378?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1732fd2b-7bb8-473c-b73b-3e96299f7e07_1180x685.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!4E9L!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1732fd2b-7bb8-473c-b73b-3e96299f7e07_1180x685.png 424w, https://substackcdn.com/image/fetch/$s_!4E9L!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1732fd2b-7bb8-473c-b73b-3e96299f7e07_1180x685.png 848w, https://substackcdn.com/image/fetch/$s_!4E9L!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1732fd2b-7bb8-473c-b73b-3e96299f7e07_1180x685.png 1272w, https://substackcdn.com/image/fetch/$s_!4E9L!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1732fd2b-7bb8-473c-b73b-3e96299f7e07_1180x685.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Putting all this together, I would make three changes to most AI search evaluation frameworks.</p><p>First, I would scope the framework to a specific user role and task. A single universal score is usually misleading. The better question is: useful for whom, and for what purpose?</p><p>Second, I would treat retrieval capability as a core task-performance gate for search tools. This does not mean retrieval is the only possible hard gate. Privacy, accessibility, licence terms, data governance, and institutional requirements may also be non-negotiable. But if we are evaluating a search tool, it should first be able to search well.</p><p>Third, I would make at least some criteria more empirical. Reproducibility can be tested by rerunning queries. 
Interpretability can sometimes be tested by comparing generated search strings with actual results. Claim-source faithfulness can be tested by checking whether cited sources support generated claims. Retrieval can be tested, even lightly, using realistic queries and simple measures of usefulness.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee via ko-fi!&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee via ko-fi!</span></a></p><p>The gating point matters most to me. A search tool with weak retrieval is not redeemed by good citation handling, a polished interface, or convenient administration features. Those things matter, but only after the tool has passed the basic test of finding useful material.</p><p><em><strong>I am not planning to publish my own framework.</strong></em> I do not want the maintenance burden, and I do not have a strong personal use case for one.</p><p>But if you are building one, my advice is simple: decide who it is for, decide what is non-negotiable, and make the most important criteria as testable as you reasonably can.</p><p>In future posts, I will go deeper into retrieval testing itself. 
</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe now&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://aarontay.substack.com/subscribe?"><span>Subscribe now</span></a></p><p></p><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-1" href="#footnote-anchor-1" class="footnote-number" contenteditable="false" target="_self">1</a><div class="footnote-content"><p>To be fair, this framework doesn&#8217;t seem focused just on AI <em><strong>search</strong></em> tools, but also covers other literature review tools, such as &#8220;citation-based literature mapping tools&#8221; like Research Rabbit, Connected Papers and Litmaps.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-2" href="#footnote-anchor-2" class="footnote-number" contenteditable="false" target="_self">2</a><div class="footnote-content"><p>&#8220;Retrieval capability&#8221; is multi-dimensional and there are many ways to measure it. Though I suggest just one lightweight test, formal testing would often measure retrieval capability in multiple ways to get the full picture. If you include search engines that generate RAG-type answers, there are even more metrics to use for measurement.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-3" href="#footnote-anchor-3" class="footnote-number" contenteditable="false" target="_self">3</a><div class="footnote-content"><p>We need to define relevance criteria before judging results, though this does not mean building a full gold-standard set in advance. TREC-style pooling, for example, judges documents after they have been retrieved. 
But the topic, task, and judgement rules still need to be clear; otherwise a lightweight precision test can collapse back into subjective impression.</p><p></p></div></div>]]></content:encoded></item><item><title><![CDATA[AI academic search needs better frameworks for understanding and evaluation. These three librarian projects are a start]]></title><description><![CDATA[What it looks like when the AI search conversation and understanding gets serious]]></description><link>https://aarontay.substack.com/p/ai-academic-search-needs-better-frameworks</link><guid isPermaLink="false">https://aarontay.substack.com/p/ai-academic-search-needs-better-frameworks</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Mon, 20 Apr 2026 17:04:28 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!Trq3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff31c413-cb8e-40b9-a96d-266262e1036c_492x855.webp" length="0" type="image/jpeg"/><content:encoded><![CDATA[<p>Most librarian commentary on AI search still operates at the level of warnings and impressions. Tools hallucinate. Sources are opaque. Students should be cautious. 
None of this is wrong, but none of it helps a colleague decide whether Undermind is appropriate for a scoping review or whether SciSpace&#8217;s summaries can be trusted in a literature class.</p><p>What would help is work that treats these systems as understandable and evaluable: layered architectures with retrieval components, generation components, interfaces, and trade-offs that can be named and weighed.</p><p>As <a href="https://mikecaulfield.substack.com/p/its-a-fancy-search-result?utm_source=share&amp;utm_medium=android&amp;r=62upd&amp;triedRedirect=true">Mike Caulfield of SIFT fame has observed, there is great value and explanatory power in seeing what AI does through the lens of &#8220;a fancy search result&#8221; rather than just an answer.</a> He notes:</p><blockquote><p>&#8230; stop thinking of the result as an answer, and start thinking of it as a search result with some synthesis on top. When all the sources are in alignment that can of course present as an answer &#8212; but it still is downstream from available sources, it still has made decisions about weighting, and so forth. If you think of it as a dressed up search result instead of an intelligence (albeit one that can synthesize in impressive ways) you&#8217;ll be better able to process the weirdness that sometimes results.</p></blockquote><p>Over the last week, three librarians &#8212; none of them coordinating with me or with each other &#8212; have published work on AI search that leans in this more productive direction.  <a href="https://library.hkust.edu.hk/news-events/news/snapshot-genai-tools-research">Aster Zhao at HKUST</a>, <a href="https://omnomdombomb.github.io/ai_evaluation_framework_tool/AI-Tool-Assessment-Framework.html">Wang Huajin at Carnegie Mellon</a>, and <a href="https://alfredhw.github.io/airubric/">Alfred Wallace at the University of North Dakota</a> each built something concrete: an interface, a framework, a rubric (vibe coded with Claude). 
All three happen to cite my work, which is flattering.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee via ko-fi!&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee via ko-fi!</span></a></p><p>Taken together, these three projects make a point I keep returning to. The conversation around AI search needs to happen at a better level. We need fewer sweeping claims and more attempts to clarify how systems differ, what assumptions they encode, and how they should be assessed for particular tasks.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><h2>1. 
Aster Zhao&#8217;s (Hong Kong University of Science and Technology) snapshot of GenAI tools for research</h2><p>The first example is by Aster Zhao from HKUST Library: <strong><a href="https://library.hkust.edu.hk/news-events/news/snapshot-genai-tools-research">Snapshot of GenAI Tools for Research</a></strong><a href="https://library.hkust.edu.hk/news-events/news/snapshot-genai-tools-research">.</a> </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Trq3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff31c413-cb8e-40b9-a96d-266262e1036c_492x855.webp" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Trq3!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff31c413-cb8e-40b9-a96d-266262e1036c_492x855.webp 424w, https://substackcdn.com/image/fetch/$s_!Trq3!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff31c413-cb8e-40b9-a96d-266262e1036c_492x855.webp 848w, https://substackcdn.com/image/fetch/$s_!Trq3!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff31c413-cb8e-40b9-a96d-266262e1036c_492x855.webp 1272w, https://substackcdn.com/image/fetch/$s_!Trq3!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff31c413-cb8e-40b9-a96d-266262e1036c_492x855.webp 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Trq3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff31c413-cb8e-40b9-a96d-266262e1036c_492x855.webp" 
width="492" height="855" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ff31c413-cb8e-40b9-a96d-266262e1036c_492x855.webp&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:855,&quot;width&quot;:492,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Trq3!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff31c413-cb8e-40b9-a96d-266262e1036c_492x855.webp 424w, https://substackcdn.com/image/fetch/$s_!Trq3!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff31c413-cb8e-40b9-a96d-266262e1036c_492x855.webp 848w, https://substackcdn.com/image/fetch/$s_!Trq3!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff31c413-cb8e-40b9-a96d-266262e1036c_492x855.webp 1272w, https://substackcdn.com/image/fetch/$s_!Trq3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff31c413-cb8e-40b9-a96d-266262e1036c_492x855.webp 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>What I like about this one is that it does more than list tools (and a very comprehensive list it is with 40+ tools). Besides a comprehensive table view, it includes a strong timeline showing the evolution of AI search and the different &#8220;roles&#8221; that AI plays in search tools. 
That visual layer makes a messy landscape much easier to understand.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!oG7B!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0fdc736-3a88-4a0b-a3d6-99282d78b361_485x973.webp" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!oG7B!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0fdc736-3a88-4a0b-a3d6-99282d78b361_485x973.webp 424w, https://substackcdn.com/image/fetch/$s_!oG7B!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0fdc736-3a88-4a0b-a3d6-99282d78b361_485x973.webp 848w, https://substackcdn.com/image/fetch/$s_!oG7B!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0fdc736-3a88-4a0b-a3d6-99282d78b361_485x973.webp 1272w, https://substackcdn.com/image/fetch/$s_!oG7B!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0fdc736-3a88-4a0b-a3d6-99282d78b361_485x973.webp 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!oG7B!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0fdc736-3a88-4a0b-a3d6-99282d78b361_485x973.webp" width="485" height="973" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f0fdc736-3a88-4a0b-a3d6-99282d78b361_485x973.webp&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:973,&quot;width&quot;:485,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!oG7B!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0fdc736-3a88-4a0b-a3d6-99282d78b361_485x973.webp 424w, https://substackcdn.com/image/fetch/$s_!oG7B!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0fdc736-3a88-4a0b-a3d6-99282d78b361_485x973.webp 848w, https://substackcdn.com/image/fetch/$s_!oG7B!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0fdc736-3a88-4a0b-a3d6-99282d78b361_485x973.webp 1272w, https://substackcdn.com/image/fetch/$s_!oG7B!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff0fdc736-3a88-4a0b-a3d6-99282d78b361_485x973.webp 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!7Zyz!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77663737-7f0c-44ec-a51f-a691ac253933_492x964.webp" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!7Zyz!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77663737-7f0c-44ec-a51f-a691ac253933_492x964.webp 424w, https://substackcdn.com/image/fetch/$s_!7Zyz!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77663737-7f0c-44ec-a51f-a691ac253933_492x964.webp 848w, 
https://substackcdn.com/image/fetch/$s_!7Zyz!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77663737-7f0c-44ec-a51f-a691ac253933_492x964.webp 1272w, https://substackcdn.com/image/fetch/$s_!7Zyz!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77663737-7f0c-44ec-a51f-a691ac253933_492x964.webp 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!7Zyz!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77663737-7f0c-44ec-a51f-a691ac253933_492x964.webp" width="492" height="964" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/77663737-7f0c-44ec-a51f-a691ac253933_492x964.webp&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:964,&quot;width&quot;:492,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!7Zyz!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77663737-7f0c-44ec-a51f-a691ac253933_492x964.webp 424w, https://substackcdn.com/image/fetch/$s_!7Zyz!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77663737-7f0c-44ec-a51f-a691ac253933_492x964.webp 848w, 
https://substackcdn.com/image/fetch/$s_!7Zyz!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77663737-7f0c-44ec-a51f-a691ac253933_492x964.webp 1272w, https://substackcdn.com/image/fetch/$s_!7Zyz!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77663737-7f0c-44ec-a51f-a691ac253933_492x964.webp 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The work also cites some of my own frameworks and distinctions, including:</p><ul><li><p><a 
href="https://aarontay.substack.com/p/how-agentic-are-academic-deep-research">the four-quadrant framework, which divides search into Quick Search, Quick RAG, Deep Search, and Deep RAG</a></p></li><li><p><a href="https://aarontay.substack.com/p/how-agentic-are-academic-deep-research">The distinction between academic deep search tools that are &#8220;workflow-bound&#8221; vs autonomous, with the former struggling when asked to do tasks they were not designed for.</a></p></li><li><p><a href="https://aarontay.substack.com/p/the-horseless-carriage-of-ai-search">The Horseless Carriage of AI Search</a>, where I critique vendors who sell &#8220;AI search&#8221; but equate it with just the simplistic use of LLMs for Boolean query construction and similar bolt-on approaches, while ignoring other more productive approaches like semantic search, better reranking and agentic search.</p></li></ul><p>Overall, this is a strong and current map of the space, helping people to see that AI search is not one thing.  I have been planning to update <a href="https://musingsaboutlibrarianship.blogspot.com/p/list-of-academic-search-engines-that.html">my own list of such tools here</a> but Aster&#8217;s work has reduced my incentive to do so.</p><h2>2. Wang Huajin&#8217;s (Carnegie Mellon University) AI-Powered Tool Assessment Framework</h2><p>The second example is <strong><a href="https://omnomdombomb.github.io/ai_evaluation_framework_tool/AI-Tool-Assessment-Framework.html">AI-Powered Tool Assessment Framework</a></strong><a href="https://omnomdombomb.github.io/ai_evaluation_framework_tool/AI-Tool-Assessment-Framework.html"> </a>by Wang Huajin of CMU.</p><p>This project is especially interesting because I often get asked during my talks or workshops for an evaluation framework for AI search tools, and in truth I have not been fully happy with many of the existing ones (more on that later). 
This framework gets closer to something I could actually endorse.</p><p>It asks evaluators to consider questions across four areas: retrieval, generation, output, and usability. That already puts it ahead of a great deal of discussion, because it treats these systems as layered and evaluable rather than as black boxes that either &#8220;work&#8221; or &#8220;hallucinate&#8221;.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!mgPn!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6b28ca7e-061a-4f2b-813f-8dc61100a435_754x1064.webp" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!mgPn!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6b28ca7e-061a-4f2b-813f-8dc61100a435_754x1064.webp 424w, https://substackcdn.com/image/fetch/$s_!mgPn!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6b28ca7e-061a-4f2b-813f-8dc61100a435_754x1064.webp 848w, https://substackcdn.com/image/fetch/$s_!mgPn!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6b28ca7e-061a-4f2b-813f-8dc61100a435_754x1064.webp 1272w, https://substackcdn.com/image/fetch/$s_!mgPn!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6b28ca7e-061a-4f2b-813f-8dc61100a435_754x1064.webp 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!mgPn!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6b28ca7e-061a-4f2b-813f-8dc61100a435_754x1064.webp" width="754" height="1064" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/6b28ca7e-061a-4f2b-813f-8dc61100a435_754x1064.webp&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1064,&quot;width&quot;:754,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!mgPn!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6b28ca7e-061a-4f2b-813f-8dc61100a435_754x1064.webp 424w, https://substackcdn.com/image/fetch/$s_!mgPn!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6b28ca7e-061a-4f2b-813f-8dc61100a435_754x1064.webp 848w, https://substackcdn.com/image/fetch/$s_!mgPn!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6b28ca7e-061a-4f2b-813f-8dc61100a435_754x1064.webp 1272w, https://substackcdn.com/image/fetch/$s_!mgPn!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6b28ca7e-061a-4f2b-813f-8dc61100a435_754x1064.webp 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>It appears to draw substantially on my older <strong>Testing AI Academic Search Engines</strong> series (<a href="https://aarontay.substack.com/p/testing-ai-academic-search-engines-1">part I</a> and <a href="https://aarontay.substack.com/p/testing-ai-academic-search-engines-what">II</a>) - adapting many of the questions I put in them, though I do not want to overstate my influence here. There is at least one section, on sustainability, that does not come from me, and that is a good thing.  </p><p>Huajin will also be presenting at <strong><a href="https://event.fourwaves.com/force2026/abstracts/8d848fe4-009f-48f5-b031-7dd04107d950">FORCE2026 in June in Singapore on &#8220;Developing an assessment framework to support critical evaluation of AI-powered academic search engines&#8221;</a></strong>, which suggests this is not just a quick web experiment but part of a serious and wider conversation within her institution. I am looking forward to her presentation.</p><p></p><h2>3. 
Alfred Wallace&#8217;s (University of North Dakota) adjustable rubric for AI search tools</h2><p>One reason I have resisted producing a neat evaluation matrix with fixed weights, a catchy name, and a polished PDF is that evaluation is rarely one-size-fits-all. Different users, tasks, and contexts demand different priorities. A tool that is useful for helping undergraduates find a few relevant papers will be unsuitable as a search tool meant for high-recall results. A tool that is fast and convenient may be unacceptable if transparency or source traceability matters.</p><p>The third project, by Alfred Wallace at the University of North Dakota &#8212; <a href="https://alfredhw.github.io/airubric/">Evaluating AI Tools for Research</a> &#8212; handles this better than most. Its structure is fairly traditional, focusing on sources, models, and wrappers, and the categories themselves are not ground-breaking. </p><p>The framework incorporates the provenance of the tool (established vendor, startup, or user-built), which is essential for maintaining a macro-level, long-term perspective beyond isolated feature sets.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!2VyU!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29669988-7ea7-4a37-bd9e-eb25531ddacc_984x488.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!2VyU!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29669988-7ea7-4a37-bd9e-eb25531ddacc_984x488.png 424w, https://substackcdn.com/image/fetch/$s_!2VyU!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29669988-7ea7-4a37-bd9e-eb25531ddacc_984x488.png 848w, 
https://substackcdn.com/image/fetch/$s_!2VyU!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29669988-7ea7-4a37-bd9e-eb25531ddacc_984x488.png 1272w, https://substackcdn.com/image/fetch/$s_!2VyU!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29669988-7ea7-4a37-bd9e-eb25531ddacc_984x488.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!2VyU!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29669988-7ea7-4a37-bd9e-eb25531ddacc_984x488.png" width="984" height="488" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/29669988-7ea7-4a37-bd9e-eb25531ddacc_984x488.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:488,&quot;width&quot;:984,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:41387,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/194669966?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29669988-7ea7-4a37-bd9e-eb25531ddacc_984x488.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!2VyU!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29669988-7ea7-4a37-bd9e-eb25531ddacc_984x488.png 424w, https://substackcdn.com/image/fetch/$s_!2VyU!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29669988-7ea7-4a37-bd9e-eb25531ddacc_984x488.png 848w, 
https://substackcdn.com/image/fetch/$s_!2VyU!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29669988-7ea7-4a37-bd9e-eb25531ddacc_984x488.png 1272w, https://substackcdn.com/image/fetch/$s_!2VyU!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F29669988-7ea7-4a37-bd9e-eb25531ddacc_984x488.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Finally, it has one important feature: users can adjust weights of criteria when calculating a final score. 
That is a much more sensible approach than pretending there is a universal rubric that works equally well for everyone.  </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!zzBa!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F40343e95-3c8c-4b04-82e0-3ccbc751ba0a_726x1069.webp" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!zzBa!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F40343e95-3c8c-4b04-82e0-3ccbc751ba0a_726x1069.webp 424w, https://substackcdn.com/image/fetch/$s_!zzBa!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F40343e95-3c8c-4b04-82e0-3ccbc751ba0a_726x1069.webp 848w, https://substackcdn.com/image/fetch/$s_!zzBa!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F40343e95-3c8c-4b04-82e0-3ccbc751ba0a_726x1069.webp 1272w, https://substackcdn.com/image/fetch/$s_!zzBa!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F40343e95-3c8c-4b04-82e0-3ccbc751ba0a_726x1069.webp 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!zzBa!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F40343e95-3c8c-4b04-82e0-3ccbc751ba0a_726x1069.webp" width="726" height="1069" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/40343e95-3c8c-4b04-82e0-3ccbc751ba0a_726x1069.webp&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1069,&quot;width&quot;:726,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!zzBa!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F40343e95-3c8c-4b04-82e0-3ccbc751ba0a_726x1069.webp 424w, https://substackcdn.com/image/fetch/$s_!zzBa!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F40343e95-3c8c-4b04-82e0-3ccbc751ba0a_726x1069.webp 848w, https://substackcdn.com/image/fetch/$s_!zzBa!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F40343e95-3c8c-4b04-82e0-3ccbc751ba0a_726x1069.webp 1272w, https://substackcdn.com/image/fetch/$s_!zzBa!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F40343e95-3c8c-4b04-82e0-3ccbc751ba0a_726x1069.webp 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>As it now stands, you select a Scenario based on whether you are a faculty researcher, graduate student, undergraduate, instructor or student, which will automatically flag different criteria as either &#8220;priority&#8221; or &#8220;key question&#8221; categories that affect the weighting. While you cannot change which criteria<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-1" href="#footnote-1" target="_self">1</a> are considered &#8220;priority&#8221; or &#8220;key question&#8221;, you can change the size of the multiplier for criteria in either category.</p><p>The criteria listed also reflect an informed understanding of how AI search systems differ architecturally. 
Alfred cites my writing  <strong>(citing specifically the <a href="https://aarontay.substack.com/p/the-horseless-carriage-of-ai-search">horseless carriage post</a>)</strong> to support his &#8220;AI search architecture spectrum&#8221;, including the distinctions between LLM-only approaches, Boolean generation, Boolean plus reranking, hybrid search, and agentic or deep search.</p><p>Again, what matters here is not whether every category or weighting is perfect. It is that the tool reflects a more informed understanding of how AI search systems differ under the hood.</p><p>This project ends with a fascinating section on &#8220;Visions of the future&#8221; including the <a href="https://aarontay.substack.com/p/from-fixed-search-workflows-to-agentic">struggle between a future where users work on explicit platforms (both existing and new ones) vs ones where &#8220;literature research lives in the same tool that does data analysis, coding&#8230;&#8221;. </a></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!17nw!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1728f0bd-a9f6-464a-8873-c43f2290d654_1009x736.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!17nw!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1728f0bd-a9f6-464a-8873-c43f2290d654_1009x736.png 424w, https://substackcdn.com/image/fetch/$s_!17nw!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1728f0bd-a9f6-464a-8873-c43f2290d654_1009x736.png 848w, 
https://substackcdn.com/image/fetch/$s_!17nw!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1728f0bd-a9f6-464a-8873-c43f2290d654_1009x736.png 1272w, https://substackcdn.com/image/fetch/$s_!17nw!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1728f0bd-a9f6-464a-8873-c43f2290d654_1009x736.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!17nw!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1728f0bd-a9f6-464a-8873-c43f2290d654_1009x736.png" width="1009" height="736" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/1728f0bd-a9f6-464a-8873-c43f2290d654_1009x736.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:736,&quot;width&quot;:1009,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:49598,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/194669966?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1728f0bd-a9f6-464a-8873-c43f2290d654_1009x736.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!17nw!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1728f0bd-a9f6-464a-8873-c43f2290d654_1009x736.png 424w, 
https://substackcdn.com/image/fetch/$s_!17nw!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1728f0bd-a9f6-464a-8873-c43f2290d654_1009x736.png 848w, https://substackcdn.com/image/fetch/$s_!17nw!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1728f0bd-a9f6-464a-8873-c43f2290d654_1009x736.png 1272w, https://substackcdn.com/image/fetch/$s_!17nw!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1728f0bd-a9f6-464a-8873-c43f2290d654_1009x736.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2>Conclusion</h2><p>To be clear, I do not want to overstate my influence on any of these projects. Nor do I necessarily endorse every detail in all three. </p><blockquote><p>In fact, I will have much to say about assessment frameworks and metrics for AI search tools in my next post.  </p></blockquote><p>But I do think they are all amazing attempts by librarians to engage with AI search.</p><p>That said, three projects, all citing me, have an obvious selection effect: the librarians already engaging at this level are precisely the ones likely to read what I write<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-2" href="#footnote-2" target="_self">2</a>. So this is not the strongest evidence that the wider conversation has shifted. Still, anecdotally, looking at recorded talks and presentations by academic librarians, there seems to be much more understanding of how AI search works under the hood compared to, say, 2023/2024.  </p><p>If AI search tools are going to become part of academic workflows, we need more work of this kind: work that helps us distinguish between kinds of systems, evaluate them in context, and make their assumptions more visible. Blog posts can start those conversations. Interfaces, frameworks, and rubrics make the ideas usable for others. 
</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee via ko-fi&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee via ko-fi</span></a></p><h2>Bonus</h2><p>As a bonus example, I would also point to <a href="https://library.smu.edu.sg/topics-insights/what-if-claude-or-chatgpt-could-search-academic-databases-you-and-then-do-something">my recent SMU Libraries piece on MCP for researchers.</a> It is doing something slightly different from the three projects above, but in a complementary way. </p><p>Rather than offering a framework or rubric, it tries to explain in concrete terms what happens when tools like Scite and Consensus are connected to Claude or ChatGPT via MCP, so that the model can search across sources, compare results, and carry out multi-step academic workflows on the user&#8217;s behalf. </p><p>In that sense, it is less about evaluating AI search and more about making the underlying infrastructure and possibilities legible to researchers. 
It is also, I think, one of my clearer pieces on the topic, partly because it was written for an institutional audience rather than as one of my longer blog posts where I am often thinking aloud.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe now&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://aarontay.substack.com/subscribe?"><span>Subscribe now</span></a></p><p></p><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-1" href="#footnote-anchor-1" class="footnote-number" contenteditable="false" target="_self">1</a><div class="footnote-content"><p>This is, of course, something easily changed with simple vibe-coding.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-2" href="#footnote-anchor-2" class="footnote-number" contenteditable="false" target="_self">2</a><div class="footnote-content"><p>Of the three librarians, I have probably had the most contact with Aster, who attended the first run of my intensive three-session &#8220;AI-powered search for librarians&#8221; course in July 2025.</p><p></p></div></div>]]></content:encoded></item><item><title><![CDATA[From Fixed Search Workflows to Agentic Academic Search: Promise, Progress, and the Invisible Menu Problem]]></title><description><![CDATA[Undermind's Projects feature gives a taste of the promise and challenges of users managing agents]]></description><link>https://aarontay.substack.com/p/from-fixed-search-workflows-to-agentic</link><guid isPermaLink="false">https://aarontay.substack.com/p/from-fixed-search-workflows-to-agentic</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Sun, 12 Apr 2026 08:18:38 GMT</pubDate><enclosure 
url="https://substackcdn.com/image/fetch/$s_!TIeP!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6580af37-9e13-42b1-837d-bb4e006b6245_1250x708.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!TIeP!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6580af37-9e13-42b1-837d-bb4e006b6245_1250x708.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!TIeP!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6580af37-9e13-42b1-837d-bb4e006b6245_1250x708.png 424w, https://substackcdn.com/image/fetch/$s_!TIeP!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6580af37-9e13-42b1-837d-bb4e006b6245_1250x708.png 848w, https://substackcdn.com/image/fetch/$s_!TIeP!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6580af37-9e13-42b1-837d-bb4e006b6245_1250x708.png 1272w, https://substackcdn.com/image/fetch/$s_!TIeP!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6580af37-9e13-42b1-837d-bb4e006b6245_1250x708.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!TIeP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6580af37-9e13-42b1-837d-bb4e006b6245_1250x708.png" width="1250" height="708" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/6580af37-9e13-42b1-837d-bb4e006b6245_1250x708.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:708,&quot;width&quot;:1250,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1816601,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6580af37-9e13-42b1-837d-bb4e006b6245_1250x708.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!TIeP!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6580af37-9e13-42b1-837d-bb4e006b6245_1250x708.png 424w, https://substackcdn.com/image/fetch/$s_!TIeP!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6580af37-9e13-42b1-837d-bb4e006b6245_1250x708.png 848w, https://substackcdn.com/image/fetch/$s_!TIeP!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6580af37-9e13-42b1-837d-bb4e006b6245_1250x708.png 1272w, https://substackcdn.com/image/fetch/$s_!TIeP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6580af37-9e13-42b1-837d-bb4e006b6245_1250x708.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><h2>Introduction</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!cSQw!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F89a7cf8a-d90b-42ba-86e0-d4be4cea3756_1205x669.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!cSQw!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F89a7cf8a-d90b-42ba-86e0-d4be4cea3756_1205x669.png 424w, 
https://substackcdn.com/image/fetch/$s_!cSQw!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F89a7cf8a-d90b-42ba-86e0-d4be4cea3756_1205x669.png 848w, https://substackcdn.com/image/fetch/$s_!cSQw!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F89a7cf8a-d90b-42ba-86e0-d4be4cea3756_1205x669.png 1272w, https://substackcdn.com/image/fetch/$s_!cSQw!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F89a7cf8a-d90b-42ba-86e0-d4be4cea3756_1205x669.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!cSQw!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F89a7cf8a-d90b-42ba-86e0-d4be4cea3756_1205x669.png" width="1205" height="669" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/89a7cf8a-d90b-42ba-86e0-d4be4cea3756_1205x669.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:669,&quot;width&quot;:1205,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:678110,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F89a7cf8a-d90b-42ba-86e0-d4be4cea3756_1205x669.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" 
srcset="https://substackcdn.com/image/fetch/$s_!cSQw!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F89a7cf8a-d90b-42ba-86e0-d4be4cea3756_1205x669.png 424w, https://substackcdn.com/image/fetch/$s_!cSQw!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F89a7cf8a-d90b-42ba-86e0-d4be4cea3756_1205x669.png 848w, https://substackcdn.com/image/fetch/$s_!cSQw!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F89a7cf8a-d90b-42ba-86e0-d4be4cea3756_1205x669.png 1272w, https://substackcdn.com/image/fetch/$s_!cSQw!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F89a7cf8a-d90b-42ba-86e0-d4be4cea3756_1205x669.png 1456w" sizes="100vw"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" 
stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Academic search tools might be moving towards a different architectural model. <a href="https://aarontay.substack.com/p/how-agentic-are-academic-deep-research">The first generation of AI-powered literature review tools &#8212; Undermind, Consensus Deep Search, AI2&#8217;s Asta &#8212; relied on predetermined, hand-crafted workflows. </a>You entered a query, the system executed a fixed pipeline, and you received results. The LLM&#8217;s role was largely confined to query understanding and output formatting.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! 
Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!yGSh!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09601733-d2d2-4db2-b8b6-e746263bf812_1209x682.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!yGSh!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09601733-d2d2-4db2-b8b6-e746263bf812_1209x682.png 424w, https://substackcdn.com/image/fetch/$s_!yGSh!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09601733-d2d2-4db2-b8b6-e746263bf812_1209x682.png 848w, https://substackcdn.com/image/fetch/$s_!yGSh!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09601733-d2d2-4db2-b8b6-e746263bf812_1209x682.png 1272w, https://substackcdn.com/image/fetch/$s_!yGSh!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09601733-d2d2-4db2-b8b6-e746263bf812_1209x682.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!yGSh!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09601733-d2d2-4db2-b8b6-e746263bf812_1209x682.png" width="1209" 
height="682" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/09601733-d2d2-4db2-b8b6-e746263bf812_1209x682.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:682,&quot;width&quot;:1209,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1107654,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09601733-d2d2-4db2-b8b6-e746263bf812_1209x682.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!yGSh!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09601733-d2d2-4db2-b8b6-e746263bf812_1209x682.png 424w, https://substackcdn.com/image/fetch/$s_!yGSh!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09601733-d2d2-4db2-b8b6-e746263bf812_1209x682.png 848w, https://substackcdn.com/image/fetch/$s_!yGSh!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09601733-d2d2-4db2-b8b6-e746263bf812_1209x682.png 1272w, https://substackcdn.com/image/fetch/$s_!yGSh!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09601733-d2d2-4db2-b8b6-e746263bf812_1209x682.png 1456w" sizes="100vw"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>That might be changing. As LLMs have become more capable of flexible, multi-step reasoning, vendors are beginning to build systems where the AI can dynamically select and chain tools to accomplish tasks that were never explicitly programmed on their platforms. This may mark a move from academic pre-defined &#8220;deep research&#8221; workflows to more flexible agentic search flows<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-1" href="#footnote-1" target="_self">1</a> being available on vendor platforms and in this post, I will discuss some of the early examples such as Undermind Projects.</p><p>But this shift introduces a problem that is not getting enough attention. When a system can theoretically do anything, how does the user discover what it can actually do? 
</p><p>Unlike an advanced user who sets up his Claude Code as a &#8220;research agent&#8221;, a user of a vendor platform has nearly no insight into how the agents have been set up by the vendor. </p><p>I call this the &#8216;invisible menu&#8217; problem (a rename of what I previously called the <a href="https://aarontay.substack.com/p/the-blank-box-problem-why-its-harder">&#8220;blank box&#8221; problem</a>) and I think it may become one of the new usability challenges for the next generation of AI academic search tools that include agents on their platform.</p><p>The problem is compounded by the fact that, unlike traditional library search tools where decades of use have established shared conventions and mental models, agentic search is so new that users have no baseline expectations for what these systems should even be capable of.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/from-fixed-search-workflows-to-agentic?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://aarontay.substack.com/p/from-fixed-search-workflows-to-agentic?utm_source=substack&utm_medium=email&utm_content=share&action=share"><span>Share</span></a></p><p><a href="https://aarontay.substack.com/p/the-horseless-carriage-of-ai-search">In my previous post</a>, I argued that bolting LLMs onto legacy search paradigms, what I called the "horseless carriage" approach, delivers limited benefit, and that most of the potential improvements in search will come from better reranking and agentic search.</p><p>In this post, I examine how three tools (Elicit, Undermind, and SciSpace) are attempting to move towards embedding agentic capabilities or flows in their platform. 
I use Elicit and especially Undermind's new Projects feature as the main worked examples, and draw on what I found while using them to illustrate the invisible menu problem in practice. SciSpace is discussed more briefly as a contrast point, since I have not tested it as deeply. </p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee via ko-fi&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee via ko-fi</span></a></p><h2>Why agentic now?</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!TmXF!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2c58f1a3-16b3-4eec-9933-6de7531f58ff_1209x681.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!TmXF!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2c58f1a3-16b3-4eec-9933-6de7531f58ff_1209x681.png 424w, https://substackcdn.com/image/fetch/$s_!TmXF!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2c58f1a3-16b3-4eec-9933-6de7531f58ff_1209x681.png 848w, https://substackcdn.com/image/fetch/$s_!TmXF!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2c58f1a3-16b3-4eec-9933-6de7531f58ff_1209x681.png 1272w, https://substackcdn.com/image/fetch/$s_!TmXF!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2c58f1a3-16b3-4eec-9933-6de7531f58ff_1209x681.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!TmXF!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2c58f1a3-16b3-4eec-9933-6de7531f58ff_1209x681.png" width="1209" height="681" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/2c58f1a3-16b3-4eec-9933-6de7531f58ff_1209x681.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:681,&quot;width&quot;:1209,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:977506,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2c58f1a3-16b3-4eec-9933-6de7531f58ff_1209x681.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!TmXF!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2c58f1a3-16b3-4eec-9933-6de7531f58ff_1209x681.png 424w, https://substackcdn.com/image/fetch/$s_!TmXF!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2c58f1a3-16b3-4eec-9933-6de7531f58ff_1209x681.png 848w, https://substackcdn.com/image/fetch/$s_!TmXF!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2c58f1a3-16b3-4eec-9933-6de7531f58ff_1209x681.png 1272w, https://substackcdn.com/image/fetch/$s_!TmXF!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2c58f1a3-16b3-4eec-9933-6de7531f58ff_1209x681.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><a href="https://world.hey.com/ian.mulvany/current-state-of-ai-scholarly-discovery-services-2c21cd32">Ian Mulvany, CTO of BMJ Group, responded to my earlier post on the lack of agency in academic deep research tools </a>with an observation that captures the moment well: &#8220;The fixed workflows that the current crop of tools are showing were developed when models were weaker, yet from a product perspective, trying to build something that is simultaneously specific and general, is really hard.&#8221;</p><blockquote><p>Incidentally, Ian Mulvany will be the second keynote speaker for 
FORCE 2026, to be held in Singapore, 3-5 June, speaking on &#8220;<a href="https://event.fourwaves.com/force2026/schedule/6c16e29d-7022-45c8-8c84-a2e9e6231ef3">Surviving the Disruption: Scholarly Communication in the Age of AI</a>&#8221;. FORCE 2026 will have many tracks on this topic, <a href="https://library.smu.edu.sg/topics-insights/force2026-comes-smu-why-attend-ii-ai-research-workflows">including but not restricted to the impact of AI on literature review </a>(including a presentation by yours truly on &#8220;<a href="https://event.fourwaves.com/force2026/abstracts/93f20703-b372-4dd9-9605-58f01ba4791b">Does Agentic Deep Search Converge? Reproducibility Questions for LLM-Driven Literature Discovery</a>&#8221;).</p></blockquote><p>He is right. The tools I tested in <a href="https://aarontay.substack.com/p/how-agentic-are-academic-deep-research">that earlier post</a> often struggled when asked to do things outside their intended workflows, even when they seemed to have some of the underlying capabilities needed to succeed. The models either were not yet good enough to reason flexibly across available tools or, more likely, were constrained from doing so by the system design.</p><p>That constraint is loosening as vendors realise the capabilities of these new models. And the response is coming from multiple directions simultaneously.</p><p><strong>Vendors</strong> of specialised academic search tools face a strategic choice. They can make their products available as components in user-built agentic workflows &#8212; typically by providing MCP servers, as <a href="https://scite.ai/mcp">Scite</a>, <a href="https://consensus.app/home/mcp/">Consensus</a>, and SciSpace have done, <a href="https://elicit.com/blog/elicit-api">or APIs, as Elicit has (currently in beta)</a>.   
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!7zLD!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F590d0c95-c002-474c-b360-f211e5b8fa2c_771x485.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!7zLD!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F590d0c95-c002-474c-b360-f211e5b8fa2c_771x485.png 424w, https://substackcdn.com/image/fetch/$s_!7zLD!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F590d0c95-c002-474c-b360-f211e5b8fa2c_771x485.png 848w, https://substackcdn.com/image/fetch/$s_!7zLD!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F590d0c95-c002-474c-b360-f211e5b8fa2c_771x485.png 1272w, https://substackcdn.com/image/fetch/$s_!7zLD!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F590d0c95-c002-474c-b360-f211e5b8fa2c_771x485.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!7zLD!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F590d0c95-c002-474c-b360-f211e5b8fa2c_771x485.png" width="771" height="485" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/590d0c95-c002-474c-b360-f211e5b8fa2c_771x485.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:485,&quot;width&quot;:771,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:31991,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F590d0c95-c002-474c-b360-f211e5b8fa2c_771x485.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!7zLD!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F590d0c95-c002-474c-b360-f211e5b8fa2c_771x485.png 424w, https://substackcdn.com/image/fetch/$s_!7zLD!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F590d0c95-c002-474c-b360-f211e5b8fa2c_771x485.png 848w, https://substackcdn.com/image/fetch/$s_!7zLD!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F590d0c95-c002-474c-b360-f211e5b8fa2c_771x485.png 1272w, https://substackcdn.com/image/fetch/$s_!7zLD!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F590d0c95-c002-474c-b360-f211e5b8fa2c_771x485.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!HKRh!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32e155ba-d113-4036-87ca-0ee0c68dbae7_1327x587.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!HKRh!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32e155ba-d113-4036-87ca-0ee0c68dbae7_1327x587.png 424w, 
https://substackcdn.com/image/fetch/$s_!HKRh!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32e155ba-d113-4036-87ca-0ee0c68dbae7_1327x587.png 848w, https://substackcdn.com/image/fetch/$s_!HKRh!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32e155ba-d113-4036-87ca-0ee0c68dbae7_1327x587.png 1272w, https://substackcdn.com/image/fetch/$s_!HKRh!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32e155ba-d113-4036-87ca-0ee0c68dbae7_1327x587.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!HKRh!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32e155ba-d113-4036-87ca-0ee0c68dbae7_1327x587.png" width="1327" height="587" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/32e155ba-d113-4036-87ca-0ee0c68dbae7_1327x587.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:587,&quot;width&quot;:1327,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:49702,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32e155ba-d113-4036-87ca-0ee0c68dbae7_1327x587.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!HKRh!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32e155ba-d113-4036-87ca-0ee0c68dbae7_1327x587.png 424w, https://substackcdn.com/image/fetch/$s_!HKRh!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32e155ba-d113-4036-87ca-0ee0c68dbae7_1327x587.png 848w, https://substackcdn.com/image/fetch/$s_!HKRh!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32e155ba-d113-4036-87ca-0ee0c68dbae7_1327x587.png 1272w, https://substackcdn.com/image/fetch/$s_!HKRh!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F32e155ba-d113-4036-87ca-0ee0c68dbae7_1327x587.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" 
stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!XONH!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e469cdf-be9a-4cf5-b737-eeb0d4088f4d_1106x730.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!XONH!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e469cdf-be9a-4cf5-b737-eeb0d4088f4d_1106x730.png 424w, https://substackcdn.com/image/fetch/$s_!XONH!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e469cdf-be9a-4cf5-b737-eeb0d4088f4d_1106x730.png 848w, https://substackcdn.com/image/fetch/$s_!XONH!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e469cdf-be9a-4cf5-b737-eeb0d4088f4d_1106x730.png 1272w, https://substackcdn.com/image/fetch/$s_!XONH!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e469cdf-be9a-4cf5-b737-eeb0d4088f4d_1106x730.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!XONH!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e469cdf-be9a-4cf5-b737-eeb0d4088f4d_1106x730.png" width="1106" height="730" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/7e469cdf-be9a-4cf5-b737-eeb0d4088f4d_1106x730.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:730,&quot;width&quot;:1106,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:347585,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e469cdf-be9a-4cf5-b737-eeb0d4088f4d_1106x730.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!XONH!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e469cdf-be9a-4cf5-b737-eeb0d4088f4d_1106x730.png 424w, https://substackcdn.com/image/fetch/$s_!XONH!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e469cdf-be9a-4cf5-b737-eeb0d4088f4d_1106x730.png 848w, https://substackcdn.com/image/fetch/$s_!XONH!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e469cdf-be9a-4cf5-b737-eeb0d4088f4d_1106x730.png 1272w, https://substackcdn.com/image/fetch/$s_!XONH!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e469cdf-be9a-4cf5-b737-eeb0d4088f4d_1106x730.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><blockquote><p>&#8220;<a href="https://library.smu.edu.sg/topics-insights/what-if-claude-or-chatgpt-could-search-academic-databases-you-and-then-do-something">What If Claude or ChatGPT Could Search Academic Databases For You &#8212; and Then Do Something Useful With the Results?</a>&#8221; is a simple guide I wrote for our users.</p></blockquote><p>But they also want to maintain the value of their own platforms rather than becoming a commodity connector inside Claude or ChatGPT. Being just one MCP server among many risks ceding control of the user experience and, ultimately, the business relationship. Their response, increasingly, is to try to have it both ways: offer the connector while also making their own platform more agentic. 
Even publishers are moving in this direction &#8212; <a href="https://www.wiley.com/en-us/solutions-partnerships/ai-solutions/">Wiley AI Gateway</a> is one of the earliest academic MCP server adopters, though as a publisher rather than a search aggregator, their interests are fundamentally different from those of tools like Scite, Consensus, or SciSpace. Wiley&#8217;s MCP server returns full text chunks that may be relevant to the query on top of metadata of the paper (see <a href="https://aarontay.substack.com/p/mcp-servers-and-academic-search-the">my earlier review</a>). </p><p><strong>Libraries</strong> are not standing still either. <a href="https://liblablexicon.wordpress.com/2026/04/02/what-happens-when-ai-can-use-the-library/">UT Libraries has built a working demonstration connecting Claude to their library catalogue (Primo/Alma), Texas Archival Resources Online, their digital collections, and the Harry Ransom Center Digital Collections </a>&#8212; it can even identify the right subject librarian and give instructions for accessing archives. </p><div id="youtube2-XcNc40Kr3DU" class="youtube-wrap" data-attrs="{&quot;videoId&quot;:&quot;XcNc40Kr3DU&quot;,&quot;startTime&quot;:null,&quot;endTime&quot;:null}" data-component-name="Youtube2ToDOM"><div class="youtube-inner"><iframe src="https://www.youtube-nocookie.com/embed/XcNc40Kr3DU?rel=0&amp;autoplay=0&amp;showinfo=0&amp;enablejsapi=0" frameborder="0" loading="lazy" gesture="media" allow="autoplay; fullscreen" allowautoplay="true" allowfullscreen="true" width="728" height="409"></iframe></div></div><p><a href="https://library.yale.edu/news/yale-library-testing-ai-powered-connection-deeper-searching-library-resources">Yale University Libraries is piloting a similar MCP connector to their catalogue</a>, <a href="https://consensus.app/home/mcp/">alongside a year-long trial of Consensus.app</a>. 
If libraries can wire LLMs directly to their collections, the role of intermediary search platforms becomes less certain.</p><h2>The benchmark test: finding uncited papers</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!oUWV!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feeda2da4-fdfa-40d9-b935-686ad79a6016_1209x679.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!oUWV!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feeda2da4-fdfa-40d9-b935-686ad79a6016_1209x679.png 424w, https://substackcdn.com/image/fetch/$s_!oUWV!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feeda2da4-fdfa-40d9-b935-686ad79a6016_1209x679.png 848w, https://substackcdn.com/image/fetch/$s_!oUWV!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feeda2da4-fdfa-40d9-b935-686ad79a6016_1209x679.png 1272w, https://substackcdn.com/image/fetch/$s_!oUWV!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feeda2da4-fdfa-40d9-b935-686ad79a6016_1209x679.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!oUWV!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feeda2da4-fdfa-40d9-b935-686ad79a6016_1209x679.png" width="1209" height="679" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/eeda2da4-fdfa-40d9-b935-686ad79a6016_1209x679.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:679,&quot;width&quot;:1209,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1012517,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feeda2da4-fdfa-40d9-b935-686ad79a6016_1209x679.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!oUWV!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feeda2da4-fdfa-40d9-b935-686ad79a6016_1209x679.png 424w, https://substackcdn.com/image/fetch/$s_!oUWV!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feeda2da4-fdfa-40d9-b935-686ad79a6016_1209x679.png 848w, https://substackcdn.com/image/fetch/$s_!oUWV!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feeda2da4-fdfa-40d9-b935-686ad79a6016_1209x679.png 1272w, https://substackcdn.com/image/fetch/$s_!oUWV!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feeda2da4-fdfa-40d9-b935-686ad79a6016_1209x679.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Before examining each tool, let me explain <a href="https://aarontay.substack.com/p/how-agentic-are-academic-deep-research">the test I have used in the past</a> and use throughout this post. The task is: given an open access paper X, find papers that could have been cited in X but were not.</p><p>This is a useful yet simple test of agentic capability for several reasons. First, I don&#8217;t believe it is a predefined workflow that any vendor has pre-built, so the system must reason about how to accomplish it rather than following a script. Second, it requires genuine multi-step reasoning: the system must extract the references of paper X, search for papers on similar topics published before X, and then ensure that the papers it presents are not already in the reference list. 
Third, the target paper I use &#8212; "<a href="https://peerj.com/articles/4375/">The state of OA: a large-scale analysis of the prevalence and impact of Open Access articles</a>" &#8212; is open access and easily accessible, so even if the model lacks a specialised search tool to retrieve the references directly, it should be able to find them via a web search.</p><p>I should note its many limitations. This is a single task type that tests one kind of multi-step reasoning. A tool could fail this test and still perform well on other agentic tasks, or pass it through a fortunate sequence of actions rather than robust reasoning<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-2" href="#footnote-2" target="_self">2</a>. It is a useful probe, not a comprehensive evaluation.</p><h2>Elicit Research Agents</h2><p>Elicit has long been known for providing tailored workflows with human-in-the-loop features. They have expanded the sources they can search, <a href="https://elicit.com/blog/clinical-trials">going beyond their own academic index to include clinical trials</a>, PubMed, and the web. 
Most recently, <a href="https://elicit.com/blog/introducing-research-agent-workflows">they added &#8220;Research Agents,&#8221;</a> which appear to be agentic in the way generic LLMs are, combining available tools or workflows flexibly to solve tasks rather than following a fixed pipeline.</p><p>I tested Elicit with my usual test, and found the following prompt usually works:</p><p><code>Search the web find the references of the paper &#8220;The state of OA: a large-scale analysis of the prevalence and impact of Open Access articles.&#8221; Find papers that could have been cited but were not.</code></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!WWcs!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F56f26756-93e8-4b21-9e6c-88c4b5d470f9_502x922.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!WWcs!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F56f26756-93e8-4b21-9e6c-88c4b5d470f9_502x922.png 424w, https://substackcdn.com/image/fetch/$s_!WWcs!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F56f26756-93e8-4b21-9e6c-88c4b5d470f9_502x922.png 848w, https://substackcdn.com/image/fetch/$s_!WWcs!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F56f26756-93e8-4b21-9e6c-88c4b5d470f9_502x922.png 1272w, https://substackcdn.com/image/fetch/$s_!WWcs!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F56f26756-93e8-4b21-9e6c-88c4b5d470f9_502x922.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!WWcs!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F56f26756-93e8-4b21-9e6c-88c4b5d470f9_502x922.png" width="502" height="922" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/56f26756-93e8-4b21-9e6c-88c4b5d470f9_502x922.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:922,&quot;width&quot;:502,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!WWcs!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F56f26756-93e8-4b21-9e6c-88c4b5d470f9_502x922.png 424w, https://substackcdn.com/image/fetch/$s_!WWcs!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F56f26756-93e8-4b21-9e6c-88c4b5d470f9_502x922.png 848w, https://substackcdn.com/image/fetch/$s_!WWcs!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F56f26756-93e8-4b21-9e6c-88c4b5d470f9_502x922.png 1272w, https://substackcdn.com/image/fetch/$s_!WWcs!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F56f26756-93e8-4b21-9e6c-88c4b5d470f9_502x922.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container 
restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The critical detail here is &#8220;search the web.&#8221; Without that instruction, Elicit defaults to its academic search tool, which can find the paper but cannot give the agent access to its references. 
Screenshot below shows what happens if it uses the Elicit academic search.</p><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!mVi7!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbe4fb7c7-a426-40df-b2ab-5a94b4530f79_655x207.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!mVi7!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbe4fb7c7-a426-40df-b2ab-5a94b4530f79_655x207.png 424w, https://substackcdn.com/image/fetch/$s_!mVi7!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbe4fb7c7-a426-40df-b2ab-5a94b4530f79_655x207.png 848w, https://substackcdn.com/image/fetch/$s_!mVi7!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbe4fb7c7-a426-40df-b2ab-5a94b4530f79_655x207.png 1272w, https://substackcdn.com/image/fetch/$s_!mVi7!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbe4fb7c7-a426-40df-b2ab-5a94b4530f79_655x207.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!mVi7!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbe4fb7c7-a426-40df-b2ab-5a94b4530f79_655x207.png" width="655" height="207" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/be4fb7c7-a426-40df-b2ab-5a94b4530f79_655x207.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:207,&quot;width&quot;:655,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!mVi7!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbe4fb7c7-a426-40df-b2ab-5a94b4530f79_655x207.png 424w, https://substackcdn.com/image/fetch/$s_!mVi7!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbe4fb7c7-a426-40df-b2ab-5a94b4530f79_655x207.png 848w, https://substackcdn.com/image/fetch/$s_!mVi7!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbe4fb7c7-a426-40df-b2ab-5a94b4530f79_655x207.png 1272w, https://substackcdn.com/image/fetch/$s_!mVi7!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbe4fb7c7-a426-40df-b2ab-5a94b4530f79_655x207.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p>If you instead direct it to use its web tool, it behaves like any LLM with web access: it finds the full text of the paper, extracts the references, and proceeds with the task.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" 
href="https://substackcdn.com/image/fetch/$s_!hliw!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7226947-0188-43a2-b613-d2c8d75b5c1e_1200x668.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!hliw!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7226947-0188-43a2-b613-d2c8d75b5c1e_1200x668.png 424w, https://substackcdn.com/image/fetch/$s_!hliw!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7226947-0188-43a2-b613-d2c8d75b5c1e_1200x668.png 848w, https://substackcdn.com/image/fetch/$s_!hliw!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7226947-0188-43a2-b613-d2c8d75b5c1e_1200x668.png 1272w, https://substackcdn.com/image/fetch/$s_!hliw!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7226947-0188-43a2-b613-d2c8d75b5c1e_1200x668.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!hliw!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7226947-0188-43a2-b613-d2c8d75b5c1e_1200x668.png" width="1200" height="668" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f7226947-0188-43a2-b613-d2c8d75b5c1e_1200x668.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:668,&quot;width&quot;:1200,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:596451,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7226947-0188-43a2-b613-d2c8d75b5c1e_1200x668.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!hliw!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7226947-0188-43a2-b613-d2c8d75b5c1e_1200x668.png 424w, https://substackcdn.com/image/fetch/$s_!hliw!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7226947-0188-43a2-b613-d2c8d75b5c1e_1200x668.png 848w, https://substackcdn.com/image/fetch/$s_!hliw!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7226947-0188-43a2-b613-d2c8d75b5c1e_1200x668.png 1272w, https://substackcdn.com/image/fetch/$s_!hliw!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7226947-0188-43a2-b613-d2c8d75b5c1e_1200x668.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This is an early example of what I will be calling &#8220;the invisible menu&#8221; problem. The user has no obvious way of knowing that Elicit&#8217;s academic search tool cannot extract references from a paper, or that switching to the web tool solves the problem. 
The system has the capability, but the user must guess the right incantation to unlock it.</p><h2>Undermind Projects</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!-atc!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36c4bc2-92a6-4dcf-a80b-387f25fb9744_1201x673.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!-atc!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36c4bc2-92a6-4dcf-a80b-387f25fb9744_1201x673.png 424w, https://substackcdn.com/image/fetch/$s_!-atc!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36c4bc2-92a6-4dcf-a80b-387f25fb9744_1201x673.png 848w, https://substackcdn.com/image/fetch/$s_!-atc!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36c4bc2-92a6-4dcf-a80b-387f25fb9744_1201x673.png 1272w, https://substackcdn.com/image/fetch/$s_!-atc!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36c4bc2-92a6-4dcf-a80b-387f25fb9744_1201x673.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!-atc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36c4bc2-92a6-4dcf-a80b-387f25fb9744_1201x673.png" width="1201" height="673" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/b36c4bc2-92a6-4dcf-a80b-387f25fb9744_1201x673.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:673,&quot;width&quot;:1201,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:978235,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36c4bc2-92a6-4dcf-a80b-387f25fb9744_1201x673.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!-atc!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36c4bc2-92a6-4dcf-a80b-387f25fb9744_1201x673.png 424w, https://substackcdn.com/image/fetch/$s_!-atc!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36c4bc2-92a6-4dcf-a80b-387f25fb9744_1201x673.png 848w, https://substackcdn.com/image/fetch/$s_!-atc!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36c4bc2-92a6-4dcf-a80b-387f25fb9744_1201x673.png 1272w, https://substackcdn.com/image/fetch/$s_!-atc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36c4bc2-92a6-4dcf-a80b-387f25fb9744_1201x673.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Undermind recently added a beta "Projects" feature that represents a more substantial move towards agentic architecture. 
Unlike the current Undermind, which offers essentially one workflow (enter a query, answer clarifying questions, receive a report), the Projects feature provides three agents: a Search Architect, a Report Writer, and a Generalist.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!qpUH!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b7d736f-34ed-485b-9984-485fafd6908a_1813x843.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!qpUH!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b7d736f-34ed-485b-9984-485fafd6908a_1813x843.png 424w, https://substackcdn.com/image/fetch/$s_!qpUH!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b7d736f-34ed-485b-9984-485fafd6908a_1813x843.png 848w, https://substackcdn.com/image/fetch/$s_!qpUH!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b7d736f-34ed-485b-9984-485fafd6908a_1813x843.png 1272w, https://substackcdn.com/image/fetch/$s_!qpUH!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b7d736f-34ed-485b-9984-485fafd6908a_1813x843.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!qpUH!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b7d736f-34ed-485b-9984-485fafd6908a_1813x843.png" width="1456" height="677" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/7b7d736f-34ed-485b-9984-485fafd6908a_1813x843.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:677,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!qpUH!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b7d736f-34ed-485b-9984-485fafd6908a_1813x843.png 424w, https://substackcdn.com/image/fetch/$s_!qpUH!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b7d736f-34ed-485b-9984-485fafd6908a_1813x843.png 848w, https://substackcdn.com/image/fetch/$s_!qpUH!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b7d736f-34ed-485b-9984-485fafd6908a_1813x843.png 1272w, https://substackcdn.com/image/fetch/$s_!qpUH!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b7d736f-34ed-485b-9984-485fafd6908a_1813x843.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The <strong>Search Architect</strong> is designed to ask clarifying questions and eventually propose a "deep search," which is Undermind's full search capability rather than a standard LLM web search.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!CWgj!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff295048b-7dab-4906-a094-364f8bda4f7d_627x400.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!CWgj!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff295048b-7dab-4906-a094-364f8bda4f7d_627x400.png 424w, 
https://substackcdn.com/image/fetch/$s_!CWgj!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff295048b-7dab-4906-a094-364f8bda4f7d_627x400.png 848w, https://substackcdn.com/image/fetch/$s_!CWgj!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff295048b-7dab-4906-a094-364f8bda4f7d_627x400.png 1272w, https://substackcdn.com/image/fetch/$s_!CWgj!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff295048b-7dab-4906-a094-364f8bda4f7d_627x400.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!CWgj!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff295048b-7dab-4906-a094-364f8bda4f7d_627x400.png" width="627" height="400" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f295048b-7dab-4906-a094-364f8bda4f7d_627x400.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:400,&quot;width&quot;:627,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!CWgj!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff295048b-7dab-4906-a094-364f8bda4f7d_627x400.png 424w, 
https://substackcdn.com/image/fetch/$s_!CWgj!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff295048b-7dab-4906-a094-364f8bda4f7d_627x400.png 848w, https://substackcdn.com/image/fetch/$s_!CWgj!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff295048b-7dab-4906-a094-364f8bda4f7d_627x400.png 1272w, https://substackcdn.com/image/fetch/$s_!CWgj!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff295048b-7dab-4906-a094-364f8bda4f7d_627x400.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The <strong>Report Writer</strong> works with papers found from past searches to generate reports in the format and structure you want. Like the Search Architect, it typically asks clarifying questions before proceeding.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!QJXg!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f73e715-5a7c-4073-9841-fad4a2ca1797_598x454.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!QJXg!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f73e715-5a7c-4073-9841-fad4a2ca1797_598x454.png 424w, https://substackcdn.com/image/fetch/$s_!QJXg!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f73e715-5a7c-4073-9841-fad4a2ca1797_598x454.png 848w, https://substackcdn.com/image/fetch/$s_!QJXg!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f73e715-5a7c-4073-9841-fad4a2ca1797_598x454.png 1272w, https://substackcdn.com/image/fetch/$s_!QJXg!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f73e715-5a7c-4073-9841-fad4a2ca1797_598x454.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!QJXg!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f73e715-5a7c-4073-9841-fad4a2ca1797_598x454.png" width="598" height="454" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/0f73e715-5a7c-4073-9841-fad4a2ca1797_598x454.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:454,&quot;width&quot;:598,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:20291,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/192175020?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f73e715-5a7c-4073-9841-fad4a2ca1797_598x454.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!QJXg!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f73e715-5a7c-4073-9841-fad4a2ca1797_598x454.png 424w, https://substackcdn.com/image/fetch/$s_!QJXg!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f73e715-5a7c-4073-9841-fad4a2ca1797_598x454.png 848w, https://substackcdn.com/image/fetch/$s_!QJXg!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f73e715-5a7c-4073-9841-fad4a2ca1797_598x454.png 1272w, https://substackcdn.com/image/fetch/$s_!QJXg!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f73e715-5a7c-4073-9841-fad4a2ca1797_598x454.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The <strong>Generalist</strong> is less clearly defined, but it has access to every paper across all your searches. 
In practice, the LLMs are capable of calling each other when needed &#8212; you might be interacting with the Search Architect, but once a search completes, it may recommend switching to the Report Writer.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Y1h_!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F73acd830-16a8-4dfc-96e1-3dd3867f1a14_618x391.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Y1h_!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F73acd830-16a8-4dfc-96e1-3dd3867f1a14_618x391.png 424w, https://substackcdn.com/image/fetch/$s_!Y1h_!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F73acd830-16a8-4dfc-96e1-3dd3867f1a14_618x391.png 848w, https://substackcdn.com/image/fetch/$s_!Y1h_!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F73acd830-16a8-4dfc-96e1-3dd3867f1a14_618x391.png 1272w, https://substackcdn.com/image/fetch/$s_!Y1h_!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F73acd830-16a8-4dfc-96e1-3dd3867f1a14_618x391.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Y1h_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F73acd830-16a8-4dfc-96e1-3dd3867f1a14_618x391.png" width="618" height="391" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/73acd830-16a8-4dfc-96e1-3dd3867f1a14_618x391.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:391,&quot;width&quot;:618,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Y1h_!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F73acd830-16a8-4dfc-96e1-3dd3867f1a14_618x391.png 424w, https://substackcdn.com/image/fetch/$s_!Y1h_!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F73acd830-16a8-4dfc-96e1-3dd3867f1a14_618x391.png 848w, https://substackcdn.com/image/fetch/$s_!Y1h_!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F73acd830-16a8-4dfc-96e1-3dd3867f1a14_618x391.png 1272w, https://substackcdn.com/image/fetch/$s_!Y1h_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F73acd830-16a8-4dfc-96e1-3dd3867f1a14_618x391.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h3>Why this matters</h3><p>One of the most significant advances here is not any single agent but the ability to run multiple searches and combine the results. One longstanding piece of advice I give to users of the current Undermind is to ensure your query covers a fairly focused topic, expecting perhaps 10-50 relevant papers. A broad query like "how are LLMs used in evidence synthesis" is too unfocused; LLMs are used differently at different stages.</p><p>With the Search Architect, you can attack a broad research question (e.g. 
how are LLMs used in evidence synthesis) by running multiple focused searches to address different sub-questions:</p><p>a) How well do LLMs perform as title-abstract screeners in evidence synthesis?</p><p>b) How well do LLMs perform when generating Boolean search strategies for evidence synthesis?</p><p>c) How well do LLMs perform at data extraction in evidence synthesis?</p><p>d) How well do LLMs perform in critical appraisal for evidence synthesis?</p><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!g0Bi!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0dabd3f3-ce93-4597-aba9-c7c09002673e_606x887.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!g0Bi!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0dabd3f3-ce93-4597-aba9-c7c09002673e_606x887.png 424w, https://substackcdn.com/image/fetch/$s_!g0Bi!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0dabd3f3-ce93-4597-aba9-c7c09002673e_606x887.png 848w, https://substackcdn.com/image/fetch/$s_!g0Bi!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0dabd3f3-ce93-4597-aba9-c7c09002673e_606x887.png 1272w, https://substackcdn.com/image/fetch/$s_!g0Bi!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0dabd3f3-ce93-4597-aba9-c7c09002673e_606x887.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!g0Bi!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0dabd3f3-ce93-4597-aba9-c7c09002673e_606x887.png" width="606" height="887" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/0dabd3f3-ce93-4597-aba9-c7c09002673e_606x887.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:887,&quot;width&quot;:606,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!g0Bi!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0dabd3f3-ce93-4597-aba9-c7c09002673e_606x887.png 424w, https://substackcdn.com/image/fetch/$s_!g0Bi!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0dabd3f3-ce93-4597-aba9-c7c09002673e_606x887.png 848w, https://substackcdn.com/image/fetch/$s_!g0Bi!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0dabd3f3-ce93-4597-aba9-c7c09002673e_606x887.png 1272w, https://substackcdn.com/image/fetch/$s_!g0Bi!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0dabd3f3-ce93-4597-aba9-c7c09002673e_606x887.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container 
restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!B0tJ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffde081a6-65fe-4a19-bfd9-ed1df8b5fcbe_1066x866.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!B0tJ!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffde081a6-65fe-4a19-bfd9-ed1df8b5fcbe_1066x866.png 424w, 
https://substackcdn.com/image/fetch/$s_!B0tJ!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffde081a6-65fe-4a19-bfd9-ed1df8b5fcbe_1066x866.png 848w, https://substackcdn.com/image/fetch/$s_!B0tJ!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffde081a6-65fe-4a19-bfd9-ed1df8b5fcbe_1066x866.png 1272w, https://substackcdn.com/image/fetch/$s_!B0tJ!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffde081a6-65fe-4a19-bfd9-ed1df8b5fcbe_1066x866.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!B0tJ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffde081a6-65fe-4a19-bfd9-ed1df8b5fcbe_1066x866.png" width="1066" height="866" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/fde081a6-65fe-4a19-bfd9-ed1df8b5fcbe_1066x866.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:866,&quot;width&quot;:1066,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:95470,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffde081a6-65fe-4a19-bfd9-ed1df8b5fcbe_1066x866.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!B0tJ!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffde081a6-65fe-4a19-bfd9-ed1df8b5fcbe_1066x866.png 424w, https://substackcdn.com/image/fetch/$s_!B0tJ!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffde081a6-65fe-4a19-bfd9-ed1df8b5fcbe_1066x866.png 848w, https://substackcdn.com/image/fetch/$s_!B0tJ!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffde081a6-65fe-4a19-bfd9-ed1df8b5fcbe_1066x866.png 1272w, https://substackcdn.com/image/fetch/$s_!B0tJ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffde081a6-65fe-4a19-bfd9-ed1df8b5fcbe_1066x866.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" 
stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>All results feed into a unified &#8220;All papers&#8221; library.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!ZBc-!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93460916-42d8-46a0-b27f-642cdf101b74_1078x743.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!ZBc-!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93460916-42d8-46a0-b27f-642cdf101b74_1078x743.png 424w, https://substackcdn.com/image/fetch/$s_!ZBc-!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93460916-42d8-46a0-b27f-642cdf101b74_1078x743.png 848w, https://substackcdn.com/image/fetch/$s_!ZBc-!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93460916-42d8-46a0-b27f-642cdf101b74_1078x743.png 1272w, https://substackcdn.com/image/fetch/$s_!ZBc-!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93460916-42d8-46a0-b27f-642cdf101b74_1078x743.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!ZBc-!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93460916-42d8-46a0-b27f-642cdf101b74_1078x743.png" width="1078" 
height="743" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/93460916-42d8-46a0-b27f-642cdf101b74_1078x743.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:743,&quot;width&quot;:1078,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!ZBc-!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93460916-42d8-46a0-b27f-642cdf101b74_1078x743.png 424w, https://substackcdn.com/image/fetch/$s_!ZBc-!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93460916-42d8-46a0-b27f-642cdf101b74_1078x743.png 848w, https://substackcdn.com/image/fetch/$s_!ZBc-!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93460916-42d8-46a0-b27f-642cdf101b74_1078x743.png 1272w, https://substackcdn.com/image/fetch/$s_!ZBc-!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F93460916-42d8-46a0-b27f-642cdf101b74_1078x743.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Lastly the Report Writer can then synthesise across them.  
This part is very similar to the &#8220;Chat with experts&#8221; feature in the original Undermind: you can select predefined instructions to focus on different aspects of the report.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!QPAi!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7c15d24-fcfa-423e-91c8-c0dbc353beec_843x726.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!QPAi!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7c15d24-fcfa-423e-91c8-c0dbc353beec_843x726.png 424w, https://substackcdn.com/image/fetch/$s_!QPAi!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7c15d24-fcfa-423e-91c8-c0dbc353beec_843x726.png 848w, https://substackcdn.com/image/fetch/$s_!QPAi!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7c15d24-fcfa-423e-91c8-c0dbc353beec_843x726.png 1272w, https://substackcdn.com/image/fetch/$s_!QPAi!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7c15d24-fcfa-423e-91c8-c0dbc353beec_843x726.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!QPAi!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7c15d24-fcfa-423e-91c8-c0dbc353beec_843x726.png" width="843" height="726" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f7c15d24-fcfa-423e-91c8-c0dbc353beec_843x726.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:726,&quot;width&quot;:843,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:36325,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7c15d24-fcfa-423e-91c8-c0dbc353beec_843x726.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!QPAi!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7c15d24-fcfa-423e-91c8-c0dbc353beec_843x726.png 424w, https://substackcdn.com/image/fetch/$s_!QPAi!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7c15d24-fcfa-423e-91c8-c0dbc353beec_843x726.png 848w, https://substackcdn.com/image/fetch/$s_!QPAi!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7c15d24-fcfa-423e-91c8-c0dbc353beec_843x726.png 1272w, https://substackcdn.com/image/fetch/$s_!QPAi!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff7c15d24-fcfa-423e-91c8-c0dbc353beec_843x726.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p> It will also ask clarifying questions.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!GDQh!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e3717c1-2f89-44ca-8121-da4cc45a598f_847x882.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!GDQh!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e3717c1-2f89-44ca-8121-da4cc45a598f_847x882.png 424w, 
https://substackcdn.com/image/fetch/$s_!GDQh!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e3717c1-2f89-44ca-8121-da4cc45a598f_847x882.png 848w, https://substackcdn.com/image/fetch/$s_!GDQh!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e3717c1-2f89-44ca-8121-da4cc45a598f_847x882.png 1272w, https://substackcdn.com/image/fetch/$s_!GDQh!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e3717c1-2f89-44ca-8121-da4cc45a598f_847x882.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!GDQh!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e3717c1-2f89-44ca-8121-da4cc45a598f_847x882.png" width="847" height="882" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/5e3717c1-2f89-44ca-8121-da4cc45a598f_847x882.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:882,&quot;width&quot;:847,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:53589,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e3717c1-2f89-44ca-8121-da4cc45a598f_847x882.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!GDQh!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e3717c1-2f89-44ca-8121-da4cc45a598f_847x882.png 424w, 
https://substackcdn.com/image/fetch/$s_!GDQh!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e3717c1-2f89-44ca-8121-da4cc45a598f_847x882.png 848w, https://substackcdn.com/image/fetch/$s_!GDQh!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e3717c1-2f89-44ca-8121-da4cc45a598f_847x882.png 1272w, https://substackcdn.com/image/fetch/$s_!GDQh!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e3717c1-2f89-44ca-8121-da4cc45a598f_847x882.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!J5G9!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd77da5f1-43ae-4638-a6c4-eba88d3c971c_1050x905.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!J5G9!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd77da5f1-43ae-4638-a6c4-eba88d3c971c_1050x905.png 424w, https://substackcdn.com/image/fetch/$s_!J5G9!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd77da5f1-43ae-4638-a6c4-eba88d3c971c_1050x905.png 848w, https://substackcdn.com/image/fetch/$s_!J5G9!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd77da5f1-43ae-4638-a6c4-eba88d3c971c_1050x905.png 1272w, https://substackcdn.com/image/fetch/$s_!J5G9!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd77da5f1-43ae-4638-a6c4-eba88d3c971c_1050x905.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!J5G9!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd77da5f1-43ae-4638-a6c4-eba88d3c971c_1050x905.png" width="1050" height="905" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/d77da5f1-43ae-4638-a6c4-eba88d3c971c_1050x905.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:905,&quot;width&quot;:1050,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!J5G9!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd77da5f1-43ae-4638-a6c4-eba88d3c971c_1050x905.png 424w, https://substackcdn.com/image/fetch/$s_!J5G9!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd77da5f1-43ae-4638-a6c4-eba88d3c971c_1050x905.png 848w, https://substackcdn.com/image/fetch/$s_!J5G9!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd77da5f1-43ae-4638-a6c4-eba88d3c971c_1050x905.png 1272w, https://substackcdn.com/image/fetch/$s_!J5G9!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd77da5f1-43ae-4638-a6c4-eba88d3c971c_1050x905.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h3>Test result</h3><p>I tested Undermind Projects with my standard query: find papers that could have been cited in &#8220;The state of OA&#8221; paper but were not.</p><p><code>find me papers that could have been cited in the paper &#8220;The state of OA: a large-scale analysis of the prevalence and impact of Open Access articles.&#8221; but was not</code></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!mKXT!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91e7a311-5012-4958-8858-0f501ef1f5c7_567x384.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!mKXT!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91e7a311-5012-4958-8858-0f501ef1f5c7_567x384.png 424w, 
https://substackcdn.com/image/fetch/$s_!mKXT!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91e7a311-5012-4958-8858-0f501ef1f5c7_567x384.png 848w, https://substackcdn.com/image/fetch/$s_!mKXT!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91e7a311-5012-4958-8858-0f501ef1f5c7_567x384.png 1272w, https://substackcdn.com/image/fetch/$s_!mKXT!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91e7a311-5012-4958-8858-0f501ef1f5c7_567x384.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!mKXT!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91e7a311-5012-4958-8858-0f501ef1f5c7_567x384.png" width="567" height="384" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/91e7a311-5012-4958-8858-0f501ef1f5c7_567x384.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:384,&quot;width&quot;:567,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!mKXT!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91e7a311-5012-4958-8858-0f501ef1f5c7_567x384.png 424w, 
https://substackcdn.com/image/fetch/$s_!mKXT!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91e7a311-5012-4958-8858-0f501ef1f5c7_567x384.png 848w, https://substackcdn.com/image/fetch/$s_!mKXT!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91e7a311-5012-4958-8858-0f501ef1f5c7_567x384.png 1272w, https://substackcdn.com/image/fetch/$s_!mKXT!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91e7a311-5012-4958-8858-0f501ef1f5c7_567x384.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The system asked clarifying questions, then read the full text of the target paper (identified as &#8220;piw18&#8221; in its system). </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!0vXi!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa36f2513-67de-46a8-bdc2-3e1af6cd0e4c_716x559.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!0vXi!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa36f2513-67de-46a8-bdc2-3e1af6cd0e4c_716x559.png 424w, https://substackcdn.com/image/fetch/$s_!0vXi!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa36f2513-67de-46a8-bdc2-3e1af6cd0e4c_716x559.png 848w, https://substackcdn.com/image/fetch/$s_!0vXi!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa36f2513-67de-46a8-bdc2-3e1af6cd0e4c_716x559.png 1272w, https://substackcdn.com/image/fetch/$s_!0vXi!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa36f2513-67de-46a8-bdc2-3e1af6cd0e4c_716x559.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!0vXi!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa36f2513-67de-46a8-bdc2-3e1af6cd0e4c_716x559.png" width="716" height="559" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/a36f2513-67de-46a8-bdc2-3e1af6cd0e4c_716x559.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:716,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!0vXi!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa36f2513-67de-46a8-bdc2-3e1af6cd0e4c_716x559.png 424w, https://substackcdn.com/image/fetch/$s_!0vXi!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa36f2513-67de-46a8-bdc2-3e1af6cd0e4c_716x559.png 848w, https://substackcdn.com/image/fetch/$s_!0vXi!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa36f2513-67de-46a8-bdc2-3e1af6cd0e4c_716x559.png 1272w, https://substackcdn.com/image/fetch/$s_!0vXi!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa36f2513-67de-46a8-bdc2-3e1af6cd0e4c_716x559.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>After further clarification, it offered to launch a deep search, which I did.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!e4fn!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7379f6f-ce5b-4be9-a332-7140ded07175_704x1009.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!e4fn!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7379f6f-ce5b-4be9-a332-7140ded07175_704x1009.png 424w, https://substackcdn.com/image/fetch/$s_!e4fn!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7379f6f-ce5b-4be9-a332-7140ded07175_704x1009.png 848w, 
https://substackcdn.com/image/fetch/$s_!e4fn!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7379f6f-ce5b-4be9-a332-7140ded07175_704x1009.png 1272w, https://substackcdn.com/image/fetch/$s_!e4fn!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7379f6f-ce5b-4be9-a332-7140ded07175_704x1009.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!e4fn!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7379f6f-ce5b-4be9-a332-7140ded07175_704x1009.png" width="704" height="1009" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c7379f6f-ce5b-4be9-a332-7140ded07175_704x1009.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1009,&quot;width&quot;:704,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!e4fn!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7379f6f-ce5b-4be9-a332-7140ded07175_704x1009.png 424w, https://substackcdn.com/image/fetch/$s_!e4fn!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7379f6f-ce5b-4be9-a332-7140ded07175_704x1009.png 848w, 
https://substackcdn.com/image/fetch/$s_!e4fn!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7379f6f-ce5b-4be9-a332-7140ded07175_704x1009.png 1272w, https://substackcdn.com/image/fetch/$s_!e4fn!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7379f6f-ce5b-4be9-a332-7140ded07175_704x1009.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>At this point, I was uncertain whether the request would succeed. 
Undermind&#8217;s deep search is capable of finding papers on a similar topic and filtering to papers published before the target, but it cannot by itself filter out papers already cited.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!z34W!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ef2d5ab-8c17-4a52-8b60-94ea2348e6a1_1658x834.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!z34W!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ef2d5ab-8c17-4a52-8b60-94ea2348e6a1_1658x834.png 424w, https://substackcdn.com/image/fetch/$s_!z34W!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ef2d5ab-8c17-4a52-8b60-94ea2348e6a1_1658x834.png 848w, https://substackcdn.com/image/fetch/$s_!z34W!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ef2d5ab-8c17-4a52-8b60-94ea2348e6a1_1658x834.png 1272w, https://substackcdn.com/image/fetch/$s_!z34W!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ef2d5ab-8c17-4a52-8b60-94ea2348e6a1_1658x834.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!z34W!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ef2d5ab-8c17-4a52-8b60-94ea2348e6a1_1658x834.png" width="1456" height="732" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4ef2d5ab-8c17-4a52-8b60-94ea2348e6a1_1658x834.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:732,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!z34W!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ef2d5ab-8c17-4a52-8b60-94ea2348e6a1_1658x834.png 424w, https://substackcdn.com/image/fetch/$s_!z34W!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ef2d5ab-8c17-4a52-8b60-94ea2348e6a1_1658x834.png 848w, https://substackcdn.com/image/fetch/$s_!z34W!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ef2d5ab-8c17-4a52-8b60-94ea2348e6a1_1658x834.png 1272w, https://substackcdn.com/image/fetch/$s_!z34W!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4ef2d5ab-8c17-4a52-8b60-94ea2348e6a1_1658x834.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Once the search finished, the Generalist agent suggested running a report. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!VM66!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda1d31c3-3657-4e8d-a080-b69116e95d29_1884x882.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!VM66!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda1d31c3-3657-4e8d-a080-b69116e95d29_1884x882.png 424w, https://substackcdn.com/image/fetch/$s_!VM66!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda1d31c3-3657-4e8d-a080-b69116e95d29_1884x882.png 848w, https://substackcdn.com/image/fetch/$s_!VM66!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda1d31c3-3657-4e8d-a080-b69116e95d29_1884x882.png 1272w, https://substackcdn.com/image/fetch/$s_!VM66!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda1d31c3-3657-4e8d-a080-b69116e95d29_1884x882.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!VM66!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda1d31c3-3657-4e8d-a080-b69116e95d29_1884x882.png" width="1456" height="682" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/da1d31c3-3657-4e8d-a080-b69116e95d29_1884x882.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:682,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!VM66!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda1d31c3-3657-4e8d-a080-b69116e95d29_1884x882.png 424w, https://substackcdn.com/image/fetch/$s_!VM66!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda1d31c3-3657-4e8d-a080-b69116e95d29_1884x882.png 848w, https://substackcdn.com/image/fetch/$s_!VM66!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda1d31c3-3657-4e8d-a080-b69116e95d29_1884x882.png 1272w, https://substackcdn.com/image/fetch/$s_!VM66!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda1d31c3-3657-4e8d-a080-b69116e95d29_1884x882.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>I clicked the &#8220;Generate Report&#8221; button and started prompting the Report writer agent.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!7my3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1e8d63cb-f56d-46f0-aa60-ca6de946b0c5_749x542.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!7my3!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1e8d63cb-f56d-46f0-aa60-ca6de946b0c5_749x542.png 424w, https://substackcdn.com/image/fetch/$s_!7my3!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1e8d63cb-f56d-46f0-aa60-ca6de946b0c5_749x542.png 848w, 
https://substackcdn.com/image/fetch/$s_!7my3!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1e8d63cb-f56d-46f0-aa60-ca6de946b0c5_749x542.png 1272w, https://substackcdn.com/image/fetch/$s_!7my3!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1e8d63cb-f56d-46f0-aa60-ca6de946b0c5_749x542.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!7my3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1e8d63cb-f56d-46f0-aa60-ca6de946b0c5_749x542.png" width="749" height="542" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/1e8d63cb-f56d-46f0-aa60-ca6de946b0c5_749x542.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:542,&quot;width&quot;:749,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!7my3!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1e8d63cb-f56d-46f0-aa60-ca6de946b0c5_749x542.png 424w, https://substackcdn.com/image/fetch/$s_!7my3!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1e8d63cb-f56d-46f0-aa60-ca6de946b0c5_749x542.png 848w, 
https://substackcdn.com/image/fetch/$s_!7my3!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1e8d63cb-f56d-46f0-aa60-ca6de946b0c5_749x542.png 1272w, https://substackcdn.com/image/fetch/$s_!7my3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1e8d63cb-f56d-46f0-aa60-ca6de946b0c5_749x542.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The Report writer asked its usual clarifying questions.</p><div class="captioned-image-container"><figure><a class="image-link image2 
is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!9yn3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4bc4231c-2277-4915-adda-fdca8a6b0919_797x666.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!9yn3!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4bc4231c-2277-4915-adda-fdca8a6b0919_797x666.png 424w, https://substackcdn.com/image/fetch/$s_!9yn3!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4bc4231c-2277-4915-adda-fdca8a6b0919_797x666.png 848w, https://substackcdn.com/image/fetch/$s_!9yn3!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4bc4231c-2277-4915-adda-fdca8a6b0919_797x666.png 1272w, https://substackcdn.com/image/fetch/$s_!9yn3!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4bc4231c-2277-4915-adda-fdca8a6b0919_797x666.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!9yn3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4bc4231c-2277-4915-adda-fdca8a6b0919_797x666.png" width="797" height="666" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4bc4231c-2277-4915-adda-fdca8a6b0919_797x666.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:666,&quot;width&quot;:797,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!9yn3!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4bc4231c-2277-4915-adda-fdca8a6b0919_797x666.png 424w, https://substackcdn.com/image/fetch/$s_!9yn3!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4bc4231c-2277-4915-adda-fdca8a6b0919_797x666.png 848w, https://substackcdn.com/image/fetch/$s_!9yn3!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4bc4231c-2277-4915-adda-fdca8a6b0919_797x666.png 1272w, https://substackcdn.com/image/fetch/$s_!9yn3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4bc4231c-2277-4915-adda-fdca8a6b0919_797x666.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The critical step came when the agent began &#8220;reading full texts of Piw18&#8221; &#8212; it was checking candidate papers against both the in-text citations and bibliography of the target paper. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!jJyF!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F03e3d75e-a0c6-4d46-93ca-d9030e01eaa5_791x583.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!jJyF!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F03e3d75e-a0c6-4d46-93ca-d9030e01eaa5_791x583.png 424w, https://substackcdn.com/image/fetch/$s_!jJyF!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F03e3d75e-a0c6-4d46-93ca-d9030e01eaa5_791x583.png 848w, https://substackcdn.com/image/fetch/$s_!jJyF!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F03e3d75e-a0c6-4d46-93ca-d9030e01eaa5_791x583.png 1272w, https://substackcdn.com/image/fetch/$s_!jJyF!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F03e3d75e-a0c6-4d46-93ca-d9030e01eaa5_791x583.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!jJyF!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F03e3d75e-a0c6-4d46-93ca-d9030e01eaa5_791x583.png" width="791" height="583" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/03e3d75e-a0c6-4d46-93ca-d9030e01eaa5_791x583.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:583,&quot;width&quot;:791,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!jJyF!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F03e3d75e-a0c6-4d46-93ca-d9030e01eaa5_791x583.png 424w, https://substackcdn.com/image/fetch/$s_!jJyF!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F03e3d75e-a0c6-4d46-93ca-d9030e01eaa5_791x583.png 848w, https://substackcdn.com/image/fetch/$s_!jJyF!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F03e3d75e-a0c6-4d46-93ca-d9030e01eaa5_791x583.png 1272w, https://substackcdn.com/image/fetch/$s_!jJyF!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F03e3d75e-a0c6-4d46-93ca-d9030e01eaa5_791x583.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>For example, Archambault et al. 2016 (Arc16), found by the deep search, was checked against piw18 and excluded because it was already cited.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!XvqT!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F41a8916d-9bd8-4193-baf5-2f80f859bb3b_781x473.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!XvqT!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F41a8916d-9bd8-4193-baf5-2f80f859bb3b_781x473.png 424w, https://substackcdn.com/image/fetch/$s_!XvqT!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F41a8916d-9bd8-4193-baf5-2f80f859bb3b_781x473.png 848w, 
https://substackcdn.com/image/fetch/$s_!XvqT!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F41a8916d-9bd8-4193-baf5-2f80f859bb3b_781x473.png 1272w, https://substackcdn.com/image/fetch/$s_!XvqT!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F41a8916d-9bd8-4193-baf5-2f80f859bb3b_781x473.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!XvqT!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F41a8916d-9bd8-4193-baf5-2f80f859bb3b_781x473.png" width="781" height="473" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/41a8916d-9bd8-4193-baf5-2f80f859bb3b_781x473.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:473,&quot;width&quot;:781,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!XvqT!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F41a8916d-9bd8-4193-baf5-2f80f859bb3b_781x473.png 424w, https://substackcdn.com/image/fetch/$s_!XvqT!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F41a8916d-9bd8-4193-baf5-2f80f859bb3b_781x473.png 848w, 
https://substackcdn.com/image/fetch/$s_!XvqT!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F41a8916d-9bd8-4193-baf5-2f80f859bb3b_781x473.png 1272w, https://substackcdn.com/image/fetch/$s_!XvqT!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F41a8916d-9bd8-4193-baf5-2f80f859bb3b_781x473.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The system passed the test, but my testing of the new Undermind interface revealed several problems along the way.</p><h3>Invisible menu 
problems in Undermind Projects and probably other agentic interfaces.</h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!a49D!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0598ecc1-aea4-4b8e-87f3-a1553eae4cbe_1207x675.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!a49D!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0598ecc1-aea4-4b8e-87f3-a1553eae4cbe_1207x675.png 424w, https://substackcdn.com/image/fetch/$s_!a49D!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0598ecc1-aea4-4b8e-87f3-a1553eae4cbe_1207x675.png 848w, https://substackcdn.com/image/fetch/$s_!a49D!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0598ecc1-aea4-4b8e-87f3-a1553eae4cbe_1207x675.png 1272w, https://substackcdn.com/image/fetch/$s_!a49D!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0598ecc1-aea4-4b8e-87f3-a1553eae4cbe_1207x675.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!a49D!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0598ecc1-aea4-4b8e-87f3-a1553eae4cbe_1207x675.png" width="1207" height="675" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/0598ecc1-aea4-4b8e-87f3-a1553eae4cbe_1207x675.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:675,&quot;width&quot;:1207,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1108540,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0598ecc1-aea4-4b8e-87f3-a1553eae4cbe_1207x675.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!a49D!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0598ecc1-aea4-4b8e-87f3-a1553eae4cbe_1207x675.png 424w, https://substackcdn.com/image/fetch/$s_!a49D!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0598ecc1-aea4-4b8e-87f3-a1553eae4cbe_1207x675.png 848w, https://substackcdn.com/image/fetch/$s_!a49D!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0598ecc1-aea4-4b8e-87f3-a1553eae4cbe_1207x675.png 1272w, https://substackcdn.com/image/fetch/$s_!a49D!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0598ecc1-aea4-4b8e-87f3-a1553eae4cbe_1207x675.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>While testing, I found myself uncertain about basic questions of system capability. Can you give prompts to the Report Writer that refer to specific papers using their keys (e.g. piw18)? Can you reference reports or searches that have already been completed? Can you ask the Report Writer to modify an existing report rather than creating a new one?</p><p>The answers to all of these turned out to be yes, which I confirmed by trying and then checking with the developers. For instance, you can ask the Report Writer to use results from a particular search and create a report with "a table of the most relevant papers, each with a column describing possible limitations and why it might not fully address my research goal." You can then ask it to add more sections to the same report. 
Some of these capabilities are surfaced by the system &#8212; it sometimes asks whether you want a new report or to extend an existing one, and some are even shown as GUI features &#8212; but not all of them are.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!OWVU!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb014b14b-059c-4025-8fd8-00fe27424d2c_844x533.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!OWVU!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb014b14b-059c-4025-8fd8-00fe27424d2c_844x533.png 424w, https://substackcdn.com/image/fetch/$s_!OWVU!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb014b14b-059c-4025-8fd8-00fe27424d2c_844x533.png 848w, https://substackcdn.com/image/fetch/$s_!OWVU!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb014b14b-059c-4025-8fd8-00fe27424d2c_844x533.png 1272w, https://substackcdn.com/image/fetch/$s_!OWVU!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb014b14b-059c-4025-8fd8-00fe27424d2c_844x533.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!OWVU!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb014b14b-059c-4025-8fd8-00fe27424d2c_844x533.png" width="844" height="533" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/b014b14b-059c-4025-8fd8-00fe27424d2c_844x533.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:533,&quot;width&quot;:844,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:73849,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb014b14b-059c-4025-8fd8-00fe27424d2c_844x533.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!OWVU!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb014b14b-059c-4025-8fd8-00fe27424d2c_844x533.png 424w, https://substackcdn.com/image/fetch/$s_!OWVU!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb014b14b-059c-4025-8fd8-00fe27424d2c_844x533.png 848w, https://substackcdn.com/image/fetch/$s_!OWVU!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb014b14b-059c-4025-8fd8-00fe27424d2c_844x533.png 1272w, https://substackcdn.com/image/fetch/$s_!OWVU!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb014b14b-059c-4025-8fd8-00fe27424d2c_844x533.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>I also raised with the Undermind developers that the new system requires more effort to get the same output as the current one. Under the old system, you enter a query, answer clarifying questions, and receive a comprehensive report. Under the Projects system, you must additionally run the Report Writer, potentially multiple times, each time being asked for clarification.</p><p>I requested something like a Claude.md or Claude Skill &#8212; a way to specify in advance the sections and structure I wanted, so I could get the full report in one shot. Undermind is still considering this, but the developers revealed a useful workaround: the Generalist agent has access to all the same resources as the Report Writer, but is much less likely to ask clarifying questions. 
If you want to bypass the Report Writer&#8217;s clarification loop, give the same instructions to the Generalist instead.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!EOvv!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39bbbe93-8c9f-4503-ab98-efa21b86b0db_1183x655.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!EOvv!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39bbbe93-8c9f-4503-ab98-efa21b86b0db_1183x655.png 424w, https://substackcdn.com/image/fetch/$s_!EOvv!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39bbbe93-8c9f-4503-ab98-efa21b86b0db_1183x655.png 848w, https://substackcdn.com/image/fetch/$s_!EOvv!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39bbbe93-8c9f-4503-ab98-efa21b86b0db_1183x655.png 1272w, https://substackcdn.com/image/fetch/$s_!EOvv!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39bbbe93-8c9f-4503-ab98-efa21b86b0db_1183x655.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!EOvv!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39bbbe93-8c9f-4503-ab98-efa21b86b0db_1183x655.png" width="1183" height="655" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/39bbbe93-8c9f-4503-ab98-efa21b86b0db_1183x655.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:655,&quot;width&quot;:1183,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:649775,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39bbbe93-8c9f-4503-ab98-efa21b86b0db_1183x655.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!EOvv!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39bbbe93-8c9f-4503-ab98-efa21b86b0db_1183x655.png 424w, https://substackcdn.com/image/fetch/$s_!EOvv!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39bbbe93-8c9f-4503-ab98-efa21b86b0db_1183x655.png 848w, https://substackcdn.com/image/fetch/$s_!EOvv!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39bbbe93-8c9f-4503-ab98-efa21b86b0db_1183x655.png 1272w, https://substackcdn.com/image/fetch/$s_!EOvv!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F39bbbe93-8c9f-4503-ab98-efa21b86b0db_1183x655.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This is a genuinely useful tip. It is also not the sort of capability most users, even experienced ones, would be likely to discover on their own. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!jbfa!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09de79ca-1b1b-4332-a6d2-b121a87894e1_1200x679.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!jbfa!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09de79ca-1b1b-4332-a6d2-b121a87894e1_1200x679.png 424w, https://substackcdn.com/image/fetch/$s_!jbfa!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09de79ca-1b1b-4332-a6d2-b121a87894e1_1200x679.png 848w, https://substackcdn.com/image/fetch/$s_!jbfa!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09de79ca-1b1b-4332-a6d2-b121a87894e1_1200x679.png 1272w, https://substackcdn.com/image/fetch/$s_!jbfa!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09de79ca-1b1b-4332-a6d2-b121a87894e1_1200x679.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!jbfa!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09de79ca-1b1b-4332-a6d2-b121a87894e1_1200x679.png" width="1200" height="679" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/09de79ca-1b1b-4332-a6d2-b121a87894e1_1200x679.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:679,&quot;width&quot;:1200,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:884812,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09de79ca-1b1b-4332-a6d2-b121a87894e1_1200x679.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!jbfa!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09de79ca-1b1b-4332-a6d2-b121a87894e1_1200x679.png 424w, https://substackcdn.com/image/fetch/$s_!jbfa!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09de79ca-1b1b-4332-a6d2-b121a87894e1_1200x679.png 848w, https://substackcdn.com/image/fetch/$s_!jbfa!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09de79ca-1b1b-4332-a6d2-b121a87894e1_1200x679.png 1272w, https://substackcdn.com/image/fetch/$s_!jbfa!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F09de79ca-1b1b-4332-a6d2-b121a87894e1_1200x679.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2>The invisible menu problem</h2><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!mobk!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63df3987-e56b-4ac8-bf9d-007cc38dd106_2816x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!mobk!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63df3987-e56b-4ac8-bf9d-007cc38dd106_2816x1536.png 424w, 
https://substackcdn.com/image/fetch/$s_!mobk!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63df3987-e56b-4ac8-bf9d-007cc38dd106_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!mobk!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63df3987-e56b-4ac8-bf9d-007cc38dd106_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!mobk!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63df3987-e56b-4ac8-bf9d-007cc38dd106_2816x1536.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!mobk!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63df3987-e56b-4ac8-bf9d-007cc38dd106_2816x1536.png" width="1456" height="794" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/63df3987-e56b-4ac8-bf9d-007cc38dd106_2816x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:794,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:7645363,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63df3987-e56b-4ac8-bf9d-007cc38dd106_2816x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!mobk!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63df3987-e56b-4ac8-bf9d-007cc38dd106_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!mobk!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63df3987-e56b-4ac8-bf9d-007cc38dd106_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!mobk!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63df3987-e56b-4ac8-bf9d-007cc38dd106_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!mobk!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63df3987-e56b-4ac8-bf9d-007cc38dd106_2816x1536.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" 
stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>Imagine walking into a restaurant that has no menu. You know the kitchen can cook, but you have no idea what dishes are available, what ingredients they have, or what you should ask for. You might get a brilliant meal if you happen to request the right thing, or you might miss the house speciality entirely because it never occurred to you to ask.</p><p>Now make it worse: you do not even know what type of cuisine this restaurant serves. Is it Thai? Italian? Fusion? The sign outside just says &#8220;food.&#8221; That is the situation users face with agentic search tools today.</p><blockquote><p>Compare this to a user who setups Claude Code by hand to do agentic flows, in our analogy, he would be the owner of the restaurant, and he knows how the resturant was setup, who the cooks are, what their specialities are etc. If he just copies the Claude Code workflow from someone else without understanding - we will be back to the same issue of course.</p></blockquote><p>As I noted in the introduction, I previously called this the &#8220;blank box&#8221; problem, but &#8220;invisible menu&#8221; better captures what is going on. The issue is not that the system is blank or empty &#8212; it is full of capabilities. 
The problem is that there is no menu to tell you what they are.</p><p>The invisible menu problem arises because an agentic system&#8217;s capability space is so broad that users struggle to find out what is possible through normal interaction <em>and is worsened if the user were not the one who setup the agentic system and hence does not understand even in principle what is possible.</em></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!1KKC!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4fc7067d-43b7-4e8a-8667-f2fc4870ba63_1209x671.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!1KKC!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4fc7067d-43b7-4e8a-8667-f2fc4870ba63_1209x671.png 424w, https://substackcdn.com/image/fetch/$s_!1KKC!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4fc7067d-43b7-4e8a-8667-f2fc4870ba63_1209x671.png 848w, https://substackcdn.com/image/fetch/$s_!1KKC!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4fc7067d-43b7-4e8a-8667-f2fc4870ba63_1209x671.png 1272w, https://substackcdn.com/image/fetch/$s_!1KKC!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4fc7067d-43b7-4e8a-8667-f2fc4870ba63_1209x671.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!1KKC!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4fc7067d-43b7-4e8a-8667-f2fc4870ba63_1209x671.png" width="1209" 
height="671" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4fc7067d-43b7-4e8a-8667-f2fc4870ba63_1209x671.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:671,&quot;width&quot;:1209,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:713743,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4fc7067d-43b7-4e8a-8667-f2fc4870ba63_1209x671.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!1KKC!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4fc7067d-43b7-4e8a-8667-f2fc4870ba63_1209x671.png 424w, https://substackcdn.com/image/fetch/$s_!1KKC!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4fc7067d-43b7-4e8a-8667-f2fc4870ba63_1209x671.png 848w, https://substackcdn.com/image/fetch/$s_!1KKC!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4fc7067d-43b7-4e8a-8667-f2fc4870ba63_1209x671.png 1272w, https://substackcdn.com/image/fetch/$s_!1KKC!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4fc7067d-43b7-4e8a-8667-f2fc4870ba63_1209x671.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" 
width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The system can do things the user will never discover if there are no menus, no buttons, no tooltips &#8212; just a prompt field. The user must guess what to order. This is illustrated by all three examples from this post: knowing to say "search the web" in Elicit, knowing that paper keys work as references in Undermind, knowing that the Generalist agent bypasses the Report Writer's clarification loop. 
In each case, the capability exists but is invisible to normal use.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!RX2t!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fabfa89e2-1c8a-4a93-82db-cda5b8f1b122_1204x688.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!RX2t!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fabfa89e2-1c8a-4a93-82db-cda5b8f1b122_1204x688.png 424w, https://substackcdn.com/image/fetch/$s_!RX2t!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fabfa89e2-1c8a-4a93-82db-cda5b8f1b122_1204x688.png 848w, https://substackcdn.com/image/fetch/$s_!RX2t!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fabfa89e2-1c8a-4a93-82db-cda5b8f1b122_1204x688.png 1272w, https://substackcdn.com/image/fetch/$s_!RX2t!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fabfa89e2-1c8a-4a93-82db-cda5b8f1b122_1204x688.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!RX2t!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fabfa89e2-1c8a-4a93-82db-cda5b8f1b122_1204x688.png" width="1204" height="688" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/abfa89e2-1c8a-4a93-82db-cda5b8f1b122_1204x688.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:688,&quot;width&quot;:1204,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1061895,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fabfa89e2-1c8a-4a93-82db-cda5b8f1b122_1204x688.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!RX2t!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fabfa89e2-1c8a-4a93-82db-cda5b8f1b122_1204x688.png 424w, https://substackcdn.com/image/fetch/$s_!RX2t!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fabfa89e2-1c8a-4a93-82db-cda5b8f1b122_1204x688.png 848w, https://substackcdn.com/image/fetch/$s_!RX2t!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fabfa89e2-1c8a-4a93-82db-cda5b8f1b122_1204x688.png 1272w, https://substackcdn.com/image/fetch/$s_!RX2t!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fabfa89e2-1c8a-4a93-82db-cda5b8f1b122_1204x688.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><em>Compounding this, users cannot even fall back on conventions from elsewhere. With traditional library search tools, there is a shared mental model.</em> Users know roughly what to expect from a discovery layer or a database: keyword search, date filters, subject headings, citation export. The specifics differ between Primo, EDS, and Summon, but decades of use have established conventions, and a user moving from one system to another can transfer most of their expectations. </p><p><em>With agentic search tools, no such shared mental model currently exists. </em>Every tool has a different set of capabilities, different tools connected underneath, and different invisible constraints. 
Users cannot form reasonable expectations before they start, which makes the per-tool discovery problem even harder.</p><p>Consider how the user does not know what system instructions each agent is already given, what tools or sources it has access to and more etc and is either going to not use the system&#8217;s agent capabilities to the fullest or on the flipside give prompts or inputs expecting to be doable but failing. This can be particularly dangerous because such agentic systems often &#8220;fail silently&#8221; or even if they state plainly they failed, the user may not notice this failure.</p><blockquote><p>Advanced users setting up their own agentic flows with Claude Code or Sciclaw will not face this issue as much, as they know exactly what and how it has been setup.</p></blockquote><p>Undermind features an 'agentic sources' button that surfaces example prompts, mitigating the invisible menu problem by explicitly showing users that they can reference paper keys</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!FvWl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F274107db-f922-4a35-9c2a-f3b176bd3db9_590x442.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!FvWl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F274107db-f922-4a35-9c2a-f3b176bd3db9_590x442.png 424w, https://substackcdn.com/image/fetch/$s_!FvWl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F274107db-f922-4a35-9c2a-f3b176bd3db9_590x442.png 848w, 
https://substackcdn.com/image/fetch/$s_!FvWl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F274107db-f922-4a35-9c2a-f3b176bd3db9_590x442.png 1272w, https://substackcdn.com/image/fetch/$s_!FvWl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F274107db-f922-4a35-9c2a-f3b176bd3db9_590x442.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!FvWl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F274107db-f922-4a35-9c2a-f3b176bd3db9_590x442.png" width="590" height="442" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/274107db-f922-4a35-9c2a-f3b176bd3db9_590x442.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:442,&quot;width&quot;:590,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:20934,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F274107db-f922-4a35-9c2a-f3b176bd3db9_590x442.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!FvWl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F274107db-f922-4a35-9c2a-f3b176bd3db9_590x442.png 424w, https://substackcdn.com/image/fetch/$s_!FvWl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F274107db-f922-4a35-9c2a-f3b176bd3db9_590x442.png 848w, 
https://substackcdn.com/image/fetch/$s_!FvWl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F274107db-f922-4a35-9c2a-f3b176bd3db9_590x442.png 1272w, https://substackcdn.com/image/fetch/$s_!FvWl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F274107db-f922-4a35-9c2a-f3b176bd3db9_590x442.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Below shows what happens when you click on that.</p><div class="captioned-image-container"><figure><a class="image-link image2 
is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!zzE6!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea470092-730f-4253-b45b-210aa0860a2e_447x367.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!zzE6!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea470092-730f-4253-b45b-210aa0860a2e_447x367.png 424w, https://substackcdn.com/image/fetch/$s_!zzE6!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea470092-730f-4253-b45b-210aa0860a2e_447x367.png 848w, https://substackcdn.com/image/fetch/$s_!zzE6!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea470092-730f-4253-b45b-210aa0860a2e_447x367.png 1272w, https://substackcdn.com/image/fetch/$s_!zzE6!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea470092-730f-4253-b45b-210aa0860a2e_447x367.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!zzE6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea470092-730f-4253-b45b-210aa0860a2e_447x367.png" width="447" height="367" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ea470092-730f-4253-b45b-210aa0860a2e_447x367.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:367,&quot;width&quot;:447,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:20594,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea470092-730f-4253-b45b-210aa0860a2e_447x367.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!zzE6!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea470092-730f-4253-b45b-210aa0860a2e_447x367.png 424w, https://substackcdn.com/image/fetch/$s_!zzE6!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea470092-730f-4253-b45b-210aa0860a2e_447x367.png 848w, https://substackcdn.com/image/fetch/$s_!zzE6!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea470092-730f-4253-b45b-210aa0860a2e_447x367.png 1272w, https://substackcdn.com/image/fetch/$s_!zzE6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea470092-730f-4253-b45b-210aa0860a2e_447x367.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The screenshot gives you example prompts that give you cues on what you can do. For example, this popup reveals you can give instructions to the Report Writer by referring to the paper key in the Undermind Library.</p><p>There is not yet a well-established baseline for what an agentic research tool does that users can carry from one product to another. Users cannot even form reasonable expectations before they start.</p><p>This is distinct from the well-known &#8220;black box&#8221; problem of AI opacity. A black box hides how the system reaches its output. An invisible menu hides what the system can do in the first place. 
Both are problems, but the invisible menu problem is specific to agentic systems and, I think, currently underappreciated.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!b3_h!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6cc710fb-2718-4d23-bffc-880dc4295a69_1211x675.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!b3_h!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6cc710fb-2718-4d23-bffc-880dc4295a69_1211x675.png 424w, https://substackcdn.com/image/fetch/$s_!b3_h!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6cc710fb-2718-4d23-bffc-880dc4295a69_1211x675.png 848w, https://substackcdn.com/image/fetch/$s_!b3_h!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6cc710fb-2718-4d23-bffc-880dc4295a69_1211x675.png 1272w, https://substackcdn.com/image/fetch/$s_!b3_h!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6cc710fb-2718-4d23-bffc-880dc4295a69_1211x675.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!b3_h!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6cc710fb-2718-4d23-bffc-880dc4295a69_1211x675.png" width="1211" height="675" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/6cc710fb-2718-4d23-bffc-880dc4295a69_1211x675.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:675,&quot;width&quot;:1211,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1124124,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6cc710fb-2718-4d23-bffc-880dc4295a69_1211x675.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!b3_h!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6cc710fb-2718-4d23-bffc-880dc4295a69_1211x675.png 424w, https://substackcdn.com/image/fetch/$s_!b3_h!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6cc710fb-2718-4d23-bffc-880dc4295a69_1211x675.png 848w, https://substackcdn.com/image/fetch/$s_!b3_h!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6cc710fb-2718-4d23-bffc-880dc4295a69_1211x675.png 1272w, https://substackcdn.com/image/fetch/$s_!b3_h!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6cc710fb-2718-4d23-bffc-880dc4295a69_1211x675.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>It also has direct implications for reproducibility and trust. If the user does not know what the system did, what tools it invoked, or what alternative paths it could have taken, how can they evaluate whether the output is reliable? With a fixed workflow, the steps are predictable and auditable. With an agentic system, the tool may take different paths each time, and the user may not even realise what choices were made on their behalf.</p><p>Part of this may prove temporary. As these tools mature, shared expectations across the category will form, and users will at least arrive with a baseline of what to expect. What will not go away on its own is the per-tool discovery problem: even with category conventions in place, each system will still have its own hidden affordances unless vendors deliberately surface them. 
In the interim, the cognitive burden on users is substantial.</p><h2>SciSpace Agents</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!sPtX!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd0c3169d-c493-4b80-8d1c-14abcf0c8fcc_1192x667.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!sPtX!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd0c3169d-c493-4b80-8d1c-14abcf0c8fcc_1192x667.png 424w, https://substackcdn.com/image/fetch/$s_!sPtX!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd0c3169d-c493-4b80-8d1c-14abcf0c8fcc_1192x667.png 848w, https://substackcdn.com/image/fetch/$s_!sPtX!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd0c3169d-c493-4b80-8d1c-14abcf0c8fcc_1192x667.png 1272w, https://substackcdn.com/image/fetch/$s_!sPtX!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd0c3169d-c493-4b80-8d1c-14abcf0c8fcc_1192x667.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!sPtX!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd0c3169d-c493-4b80-8d1c-14abcf0c8fcc_1192x667.png" width="1192" height="667" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/d0c3169d-c493-4b80-8d1c-14abcf0c8fcc_1192x667.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:667,&quot;width&quot;:1192,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1203056,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd0c3169d-c493-4b80-8d1c-14abcf0c8fcc_1192x667.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!sPtX!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd0c3169d-c493-4b80-8d1c-14abcf0c8fcc_1192x667.png 424w, https://substackcdn.com/image/fetch/$s_!sPtX!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd0c3169d-c493-4b80-8d1c-14abcf0c8fcc_1192x667.png 848w, https://substackcdn.com/image/fetch/$s_!sPtX!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd0c3169d-c493-4b80-8d1c-14abcf0c8fcc_1192x667.png 1272w, https://substackcdn.com/image/fetch/$s_!sPtX!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd0c3169d-c493-4b80-8d1c-14abcf0c8fcc_1192x667.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>I should be upfront that I have not tested SciSpace Agents as deeply as Elicit or Undermind, so what follows is a positioning analysis rather than a hands-on evaluation.</p><p><a href="https://scispace.com/">SciSpace has gone all-in on the agentic model</a>. Their platform is packed with over 150 &#8220;apps&#8221; and connectors to a wide range of tools and agents that go well beyond literature review<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-3" href="#footnote-3" target="_self">3</a> &#8212; searching, writing, data analysis, and more. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!xw4p!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa9e64ed3-cb14-4c4b-aa7b-255e996ec58d_700x1058.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!xw4p!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa9e64ed3-cb14-4c4b-aa7b-255e996ec58d_700x1058.png 424w, https://substackcdn.com/image/fetch/$s_!xw4p!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa9e64ed3-cb14-4c4b-aa7b-255e996ec58d_700x1058.png 848w, https://substackcdn.com/image/fetch/$s_!xw4p!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa9e64ed3-cb14-4c4b-aa7b-255e996ec58d_700x1058.png 1272w, https://substackcdn.com/image/fetch/$s_!xw4p!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa9e64ed3-cb14-4c4b-aa7b-255e996ec58d_700x1058.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!xw4p!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa9e64ed3-cb14-4c4b-aa7b-255e996ec58d_700x1058.png" width="700" height="1058" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/a9e64ed3-cb14-4c4b-aa7b-255e996ec58d_700x1058.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1058,&quot;width&quot;:700,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!xw4p!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa9e64ed3-cb14-4c4b-aa7b-255e996ec58d_700x1058.png 424w, https://substackcdn.com/image/fetch/$s_!xw4p!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa9e64ed3-cb14-4c4b-aa7b-255e996ec58d_700x1058.png 848w, https://substackcdn.com/image/fetch/$s_!xw4p!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa9e64ed3-cb14-4c4b-aa7b-255e996ec58d_700x1058.png 1272w, https://substackcdn.com/image/fetch/$s_!xw4p!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa9e64ed3-cb14-4c4b-aa7b-255e996ec58d_700x1058.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>They offer a rich agents gallery. </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!YHwZ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fec95a1c9-5d86-48de-bdf0-fefb2cdb80b7_1322x893.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!YHwZ!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fec95a1c9-5d86-48de-bdf0-fefb2cdb80b7_1322x893.png 424w, https://substackcdn.com/image/fetch/$s_!YHwZ!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fec95a1c9-5d86-48de-bdf0-fefb2cdb80b7_1322x893.png 848w, 
https://substackcdn.com/image/fetch/$s_!YHwZ!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fec95a1c9-5d86-48de-bdf0-fefb2cdb80b7_1322x893.png 1272w, https://substackcdn.com/image/fetch/$s_!YHwZ!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fec95a1c9-5d86-48de-bdf0-fefb2cdb80b7_1322x893.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!YHwZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fec95a1c9-5d86-48de-bdf0-fefb2cdb80b7_1322x893.png" width="1322" height="893" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ec95a1c9-5d86-48de-bdf0-fefb2cdb80b7_1322x893.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:893,&quot;width&quot;:1322,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!YHwZ!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fec95a1c9-5d86-48de-bdf0-fefb2cdb80b7_1322x893.png 424w, https://substackcdn.com/image/fetch/$s_!YHwZ!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fec95a1c9-5d86-48de-bdf0-fefb2cdb80b7_1322x893.png 848w, 
https://substackcdn.com/image/fetch/$s_!YHwZ!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fec95a1c9-5d86-48de-bdf0-fefb2cdb80b7_1322x893.png 1272w, https://substackcdn.com/image/fetch/$s_!YHwZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fec95a1c9-5d86-48de-bdf0-fefb2cdb80b7_1322x893.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>In concept, this amounts to a simplified, less technical version of building your own research agent with Claude Code/ <a 
href="https://github.com/drpedapati/sciclaw">sciclaw</a>: all the tools are connected automatically, requiring minimal setup.</p><p>The trade-off is cost &#8212; SciSpace charges by credit usage &#8212; and the fact that, for all its versatility, it is unproven that this breadth actually delivers better results than more focused alternatives. SciSpace occupies a middle ground between the full flexibility of a DIY setup like Claude Code and the guided experience of platforms like Undermind and Elicit, which raises the question of whether that middle ground has a natural audience.</p><p>In terms of the &#8220;invisible menu&#8221; issue, again, this is midway between a system like Undermind Projects and a complete DIY setup like Claude Code, since you get your hands dirty more than the former but less than the latter, giving you immediate understanding of the agentic flows.</p><div class="captioned-button-wrap" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/from-fixed-search-workflows-to-agentic?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="CaptionedButtonToDOM"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! 
This post is public so feel free to share it.</p></div><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/from-fixed-search-workflows-to-agentic?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://aarontay.substack.com/p/from-fixed-search-workflows-to-agentic?utm_source=substack&utm_medium=email&utm_content=share&action=share"><span>Share</span></a></p></div><p></p><h2>Conclusion</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!7SFa!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda470b4b-b591-40b6-82f8-6b135f26ddd0_1203x671.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!7SFa!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda470b4b-b591-40b6-82f8-6b135f26ddd0_1203x671.png 424w, https://substackcdn.com/image/fetch/$s_!7SFa!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda470b4b-b591-40b6-82f8-6b135f26ddd0_1203x671.png 848w, https://substackcdn.com/image/fetch/$s_!7SFa!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda470b4b-b591-40b6-82f8-6b135f26ddd0_1203x671.png 1272w, https://substackcdn.com/image/fetch/$s_!7SFa!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda470b4b-b591-40b6-82f8-6b135f26ddd0_1203x671.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!7SFa!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda470b4b-b591-40b6-82f8-6b135f26ddd0_1203x671.png" width="1203" height="671" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/da470b4b-b591-40b6-82f8-6b135f26ddd0_1203x671.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:671,&quot;width&quot;:1203,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1046211,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda470b4b-b591-40b6-82f8-6b135f26ddd0_1203x671.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!7SFa!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda470b4b-b591-40b6-82f8-6b135f26ddd0_1203x671.png 424w, https://substackcdn.com/image/fetch/$s_!7SFa!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda470b4b-b591-40b6-82f8-6b135f26ddd0_1203x671.png 848w, https://substackcdn.com/image/fetch/$s_!7SFa!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda470b4b-b591-40b6-82f8-6b135f26ddd0_1203x671.png 1272w, https://substackcdn.com/image/fetch/$s_!7SFa!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fda470b4b-b591-40b6-82f8-6b135f26ddd0_1203x671.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The academic search landscape may be shifting from rigid, predetermined workflows towards more flexible agentic architectures. 
Elicit&#8217;s Research Agents, Undermind&#8217;s Projects feature, and SciSpace Agents each represent different points on this spectrum, but they all reflect the same underlying recognition: LLMs are now capable enough to reason across tools rather than merely execute a fixed pipeline.</p><p>Yet as my testing reveals, &#8220;more agentic&#8221; does not automatically mean &#8220;more usable.&#8221; When a system can theoretically do anything, the user bears the cognitive burden of figuring out what it can actually do, which tools it will invoke, and how to phrase requests to get the desired outcome. The Undermind example is telling: even a power user (me!) needed developer tips to use the system efficiently. That does not look like a sustainable model for broader adoption.</p><p>As I discussed earlier, vendors are hedging their bets &#8212; offering MCP connectors while simultaneously layering agentic capabilities onto their own platforms &#8212; and libraries are beginning to wire up LLMs directly to their collections. Where this leaves the middle ground is uncertain. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Rd0M!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F922eb751-be87-48ac-844f-c5dde67237ba_1204x677.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Rd0M!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F922eb751-be87-48ac-844f-c5dde67237ba_1204x677.png 424w, https://substackcdn.com/image/fetch/$s_!Rd0M!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F922eb751-be87-48ac-844f-c5dde67237ba_1204x677.png 848w, https://substackcdn.com/image/fetch/$s_!Rd0M!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F922eb751-be87-48ac-844f-c5dde67237ba_1204x677.png 1272w, https://substackcdn.com/image/fetch/$s_!Rd0M!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F922eb751-be87-48ac-844f-c5dde67237ba_1204x677.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Rd0M!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F922eb751-be87-48ac-844f-c5dde67237ba_1204x677.png" width="1204" height="677" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/922eb751-be87-48ac-844f-c5dde67237ba_1204x677.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:677,&quot;width&quot;:1204,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1126734,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F922eb751-be87-48ac-844f-c5dde67237ba_1204x677.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Rd0M!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F922eb751-be87-48ac-844f-c5dde67237ba_1204x677.png 424w, https://substackcdn.com/image/fetch/$s_!Rd0M!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F922eb751-be87-48ac-844f-c5dde67237ba_1204x677.png 848w, https://substackcdn.com/image/fetch/$s_!Rd0M!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F922eb751-be87-48ac-844f-c5dde67237ba_1204x677.png 1272w, https://substackcdn.com/image/fetch/$s_!Rd0M!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F922eb751-be87-48ac-844f-c5dde67237ba_1204x677.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>My suspicion is that a general-purpose agentic platform for research, such as SciSpace Agents, will struggle to find a big audience. Technical early adopters will build their own workflows with Claude Code or similar tools like Sciclaw. Less technical users will gravitate towards familiar interfaces like Claude or ChatGPT with a few MCP connectors attached, or towards focused platforms like Undermind and Elicit that guide them through the process. 
One key question for vendors is not just whether to become more agentic, but how to do so without making their tools harder to use.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!mGFR!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd602d2d5-1461-4c15-8bd6-47cd6f2dfaf0_1211x703.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!mGFR!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd602d2d5-1461-4c15-8bd6-47cd6f2dfaf0_1211x703.png 424w, https://substackcdn.com/image/fetch/$s_!mGFR!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd602d2d5-1461-4c15-8bd6-47cd6f2dfaf0_1211x703.png 848w, https://substackcdn.com/image/fetch/$s_!mGFR!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd602d2d5-1461-4c15-8bd6-47cd6f2dfaf0_1211x703.png 1272w, https://substackcdn.com/image/fetch/$s_!mGFR!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd602d2d5-1461-4c15-8bd6-47cd6f2dfaf0_1211x703.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!mGFR!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd602d2d5-1461-4c15-8bd6-47cd6f2dfaf0_1211x703.png" width="1211" height="703" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/d602d2d5-1461-4c15-8bd6-47cd6f2dfaf0_1211x703.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:703,&quot;width&quot;:1211,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:762067,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/193754360?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd602d2d5-1461-4c15-8bd6-47cd6f2dfaf0_1211x703.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!mGFR!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd602d2d5-1461-4c15-8bd6-47cd6f2dfaf0_1211x703.png 424w, https://substackcdn.com/image/fetch/$s_!mGFR!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd602d2d5-1461-4c15-8bd6-47cd6f2dfaf0_1211x703.png 848w, https://substackcdn.com/image/fetch/$s_!mGFR!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd602d2d5-1461-4c15-8bd6-47cd6f2dfaf0_1211x703.png 1272w, https://substackcdn.com/image/fetch/$s_!mGFR!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd602d2d5-1461-4c15-8bd6-47cd6f2dfaf0_1211x703.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>What seems clear, at least from these examples, is that some tools are moving past the &#8216;horseless carriage&#8217; stage I described in my previous post. The conversation has moved beyond simply bolting LLMs onto legacy search paradigms. </p><p>If the above is correct, a major challenge now is designing agentic systems that are genuinely discoverable &#8212; where users can understand what the system is capable of without needing insider knowledge or developer access. Until that challenge is addressed, much of the promise of agentic academic search is likely to remain concentrated among users willing to tinker.</p><p>I have been thinking about what it would take to overcome the invisible menu problem &#8212; what kinds of affordances, documentation, and design patterns could help users navigate these systems more effectively. 
I hope to explore that in a future post.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee via ko-fi&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee via ko-fi</span></a></p><p></p><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-1" href="#footnote-anchor-1" class="footnote-number" contenteditable="false" target="_self">1</a><div class="footnote-content"><p>As I noted <a href="https://aarontay.substack.com/p/how-agentic-are-academic-deep-research">in an earlier post</a>, the term agent is extremely disputed. But typically it means LLMs autonomously using tools in a loop.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-2" href="#footnote-anchor-2" class="footnote-number" contenteditable="false" target="_self">2</a><div class="footnote-content"><p>Generally, if the system can pass the test at least once, I consider it a pass. It is also possible the system does not actually do the proper steps and, by pure luck, just gets papers that were not referenced.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-3" href="#footnote-anchor-3" class="footnote-number" contenteditable="false" target="_self">3</a><div class="footnote-content"><p>The original SciSpace Deep Review and search is still available as a tool to the agent. But if you want to ignore the agentic search you can <a href="https://scispace.com/search">click on &#8220;literature review&#8221;</a> on the left pane to go back to the original SciSpace search.</p></div></div>]]></content:encoded></item><item><title><![CDATA[The Horseless Carriage of AI Search: Why Using LLMs to Generate Boolean Alone Is Likely of Little Benefit]]></title><description><![CDATA[Not exactly saying Boolean must die.....but... 
maybe less focus?]]></description><link>https://aarontay.substack.com/p/the-horseless-carriage-of-ai-search</link><guid isPermaLink="false">https://aarontay.substack.com/p/the-horseless-carriage-of-ai-search</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Sat, 21 Mar 2026 06:23:47 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!WSYd!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe5695c4b-edab-48e0-8d9e-1521f10ebfac_2752x1536.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!WSYd!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe5695c4b-edab-48e0-8d9e-1521f10ebfac_2752x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!WSYd!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe5695c4b-edab-48e0-8d9e-1521f10ebfac_2752x1536.png 424w, https://substackcdn.com/image/fetch/$s_!WSYd!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe5695c4b-edab-48e0-8d9e-1521f10ebfac_2752x1536.png 848w, https://substackcdn.com/image/fetch/$s_!WSYd!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe5695c4b-edab-48e0-8d9e-1521f10ebfac_2752x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!WSYd!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe5695c4b-edab-48e0-8d9e-1521f10ebfac_2752x1536.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!WSYd!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe5695c4b-edab-48e0-8d9e-1521f10ebfac_2752x1536.png" width="1456" height="813" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/e5695c4b-edab-48e0-8d9e-1521f10ebfac_2752x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:813,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:7447623,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe5695c4b-edab-48e0-8d9e-1521f10ebfac_2752x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!WSYd!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe5695c4b-edab-48e0-8d9e-1521f10ebfac_2752x1536.png 424w, https://substackcdn.com/image/fetch/$s_!WSYd!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe5695c4b-edab-48e0-8d9e-1521f10ebfac_2752x1536.png 848w, https://substackcdn.com/image/fetch/$s_!WSYd!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe5695c4b-edab-48e0-8d9e-1521f10ebfac_2752x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!WSYd!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe5695c4b-edab-48e0-8d9e-1521f10ebfac_2752x1536.png 1456w" 
sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><strong>TL;DR:</strong> Turning natural language into Boolean is not the future of library AI search. It can help with some failed queries, but the bigger problem in most discovery systems is weak ranking, not the need for better Boolean. 
More radically, I conclude by arguing Boolean itself may no longer be the right foundation for retrieval in an era of BM25 (loose/fuzzy Boolean), hybrid search, and agentic search.</p><p>There is a growing trend among library vendors and AI search startups to use LLMs to convert natural language queries into Boolean search strings (dubbed LLM-to-Boolean from now on). Examples that use this method as part or all of their retrieval pipeline include <a href="https://katinamagazine.org/content/article/reviews/2025/deep-dive-into-three-ai-academic-search-tools">Scopus AI, Web of Science Research Assistant</a>, <a href="https://aarontay.substack.com/p/a-deep-dive-into-ebscohosts-natural-4a6">Web of Science Smart Search</a>, <a href="https://katinamagazine.org/content/article/reviews/2025/deep-dive-into-three-ai-academic-search-tools">Primo Research Assistant</a>, <a href="https://knowledge.exlibrisgroup.com/Summon/Product_Documentation/Searching_in_The_Summon_Service/Search_Features/Getting_Started_with_Summon_Research_Assistant">Summon Research Assistant</a>, <a href="https://aarontay.substack.com/p/a-deep-dive-into-ebscohosts-natural">EBSCOhost Natural Language Search</a>, <a href="https://scite.ai/assistant">Scite.ai Assistant</a>, and many more. 
Universities are also building their own versions, such as <a href="https://search.library.stonybrook.edu/discovery/search?vid=01SUNY_STB:01SUNY_STB">Stony Brook University&#8217;s SEARCH AI</a> and <a href="https://library2.sdsu.edu/onesearch/ai/">San Diego State University&#8217;s OneSearch AI Assistant.</a></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Z1xo!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ca7cd1b-9fc5-4dcb-8644-fd5b93c660b4_2816x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Z1xo!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ca7cd1b-9fc5-4dcb-8644-fd5b93c660b4_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!Z1xo!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ca7cd1b-9fc5-4dcb-8644-fd5b93c660b4_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!Z1xo!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ca7cd1b-9fc5-4dcb-8644-fd5b93c660b4_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!Z1xo!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ca7cd1b-9fc5-4dcb-8644-fd5b93c660b4_2816x1536.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Z1xo!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ca7cd1b-9fc5-4dcb-8644-fd5b93c660b4_2816x1536.png" width="1456" height="794" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/6ca7cd1b-9fc5-4dcb-8644-fd5b93c660b4_2816x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:794,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:8697319,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ca7cd1b-9fc5-4dcb-8644-fd5b93c660b4_2816x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Z1xo!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ca7cd1b-9fc5-4dcb-8644-fd5b93c660b4_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!Z1xo!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ca7cd1b-9fc5-4dcb-8644-fd5b93c660b4_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!Z1xo!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ca7cd1b-9fc5-4dcb-8644-fd5b93c660b4_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!Z1xo!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ca7cd1b-9fc5-4dcb-8644-fd5b93c660b4_2816x1536.png 1456w" sizes="100vw"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>With this many vendors and institutions converging on the same approach, you might reasonably assume this is what &#8220;AI-powered search&#8221; means &#8212; that this is the important innovation, perhaps even the whole story of how AI will transform library search.</p><p>It is not. Not even close. Using an LLM to convert natural language to Boolean may be the horseless carriage of AI-powered search<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-1" href="#footnote-1" target="_self">1</a>. When the automobile was invented, the first instinct was to build something that looked like a horse-drawn carriage but with a motor bolted on. It took years before designers realised that the new technology demanded a fundamentally different form. 
LLM-to-Boolean is the same kind of thinking: it takes the most powerful text-understanding technology ever built and uses it to produce the exact same artefact &#8212; a Boolean query string &#8212; that librarians have been crafting by hand for decades. In the simplest implementations, the LLM is mainly a more elaborate query-construction layer placed in front of an otherwise conventional lexical search engine.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!tBQc!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb8afb14a-57ea-4984-a655-a4bab3aeeb65_1199x677.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!tBQc!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb8afb14a-57ea-4984-a655-a4bab3aeeb65_1199x677.png 424w, https://substackcdn.com/image/fetch/$s_!tBQc!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb8afb14a-57ea-4984-a655-a4bab3aeeb65_1199x677.png 848w, https://substackcdn.com/image/fetch/$s_!tBQc!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb8afb14a-57ea-4984-a655-a4bab3aeeb65_1199x677.png 1272w, https://substackcdn.com/image/fetch/$s_!tBQc!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb8afb14a-57ea-4984-a655-a4bab3aeeb65_1199x677.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!tBQc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb8afb14a-57ea-4984-a655-a4bab3aeeb65_1199x677.png" width="1199" height="677" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/b8afb14a-57ea-4984-a655-a4bab3aeeb65_1199x677.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:677,&quot;width&quot;:1199,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1298764,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb8afb14a-57ea-4984-a655-a4bab3aeeb65_1199x677.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!tBQc!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb8afb14a-57ea-4984-a655-a4bab3aeeb65_1199x677.png 424w, https://substackcdn.com/image/fetch/$s_!tBQc!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb8afb14a-57ea-4984-a655-a4bab3aeeb65_1199x677.png 848w, https://substackcdn.com/image/fetch/$s_!tBQc!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb8afb14a-57ea-4984-a655-a4bab3aeeb65_1199x677.png 1272w, https://substackcdn.com/image/fetch/$s_!tBQc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb8afb14a-57ea-4984-a655-a4bab3aeeb65_1199x677.png 1456w" 
sizes="100vw"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>I am not saying this approach has zero value. For a novice user who types a full sentence into a strict Boolean search engine and gets zero results, having an LLM translate that into a workable query is a real improvement. But used alone &#8212; without modern reranking (e.g. neural ranking, embedding retrieval methods, or agentic search) &#8212; I am skeptical LLM-to-Boolean does much to improve result quality for most users<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-2" href="#footnote-2" target="_self">2</a>. 
It is important for vendors and librarians to realise this is not the main event; rather, it is a minor supporting act.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee via ko-fi&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee via ko-fi</span></a></p><p></p><h2>Retrieval versus ranking: the distinction that matters</h2><p>If we are serious about improving search in library discovery systems, we need to stop tinkering with query construction alone and start addressing the real bottleneck: what happens after retrieval.</p><p>Information retrieval teaches that search engines do two things: they retrieve documents (deciding which ones make it into the result set) and they rank those documents (deciding the order you see them in). These are distinct stages, and improvements to one do not automatically improve the other.</p><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!n7E0!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffaba3f54-9769-4864-9803-faa9341655e2_776x437.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!n7E0!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffaba3f54-9769-4864-9803-faa9341655e2_776x437.png 424w, https://substackcdn.com/image/fetch/$s_!n7E0!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffaba3f54-9769-4864-9803-faa9341655e2_776x437.png 848w, 
https://substackcdn.com/image/fetch/$s_!n7E0!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffaba3f54-9769-4864-9803-faa9341655e2_776x437.png 1272w, https://substackcdn.com/image/fetch/$s_!n7E0!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffaba3f54-9769-4864-9803-faa9341655e2_776x437.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!n7E0!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffaba3f54-9769-4864-9803-faa9341655e2_776x437.png" width="776" height="437" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/faba3f54-9769-4864-9803-faa9341655e2_776x437.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:437,&quot;width&quot;:776,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:475774,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffaba3f54-9769-4864-9803-faa9341655e2_776x437.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!n7E0!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffaba3f54-9769-4864-9803-faa9341655e2_776x437.png 424w, https://substackcdn.com/image/fetch/$s_!n7E0!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffaba3f54-9769-4864-9803-faa9341655e2_776x437.png 
848w, https://substackcdn.com/image/fetch/$s_!n7E0!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffaba3f54-9769-4864-9803-faa9341655e2_776x437.png 1272w, https://substackcdn.com/image/fetch/$s_!n7E0!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffaba3f54-9769-4864-9803-faa9341655e2_776x437.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Boolean only retrieves a candidate set of results. 
Strictly speaking, every document that matches the Boolean logic is treated as equally relevant. Ranking &#8212; typically based on <a href="https://opensourceconnections.com/blog/2015/10/16/bm25-the-next-generation-of-lucene-relevation/">lexical relevance functions like TF-IDF (term frequency - inverse document frequency) or its more sophisticated successor BM25</a> &#8212; is what determines the order you actually see results in. Most library search systems already have both stages, even if the ranking layer is not always well documented. </p><p>Most library or academic search systems rely heavily on lexical retrieval and on lexical or proprietary relevance ranking that is TF-IDF/BM25-like: based on a combination of term frequency, document frequency, document normalization and field weighting, with some additional weighting for citation counts.</p><blockquote><p><a href="https://service.elsevier.com/app/answers/detail/a_id/14182/supporthub/scopus/kw/wildcard/">Scopus, for example, mentions</a>: &#8220;The more often a term occurs in a document, the more likely that it is relevant to the topic of the article&#8221; and &#8220;Not every word is equally important. A term that occurs in nearly all documents will score less than something unusual. Scopus uses calculations based on Term Frequency/Inverse Document Frequency (TF/IDF) (a concept originally introduced by Karen Sp&#228;rck Jones, 1972) to assign a weight to any particular word in any collection of documents&#8221; </p></blockquote><p>LLM-to-Boolean is entirely focused on the retrieval stage. It changes which documents get retrieved, which matters. But it does nothing to upgrade the ranking stage &#8212; the part that determines whether the best results appear on your first page or are buried on page five. 
In an era when users routinely face thousands of results, ranking is what determines what they actually see.</p><p>The problem is that BM25, which underpins ranking in most library databases, is decades-old technology<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-3" href="#footnote-3" target="_self">3</a>. It scores relevance by counting how often your search terms appear in a document and how rare those terms are across the corpus. It has no understanding of meaning, context, or user intent.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe now&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://aarontay.substack.com/subscribe?"><span>Subscribe now</span></a></p><p></p><h2>Who does LLM-generated Boolean actually help?</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!UFcy!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9a09e2eb-cd0e-4f99-b016-c6c8e3dd10ba_1190x665.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!UFcy!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9a09e2eb-cd0e-4f99-b016-c6c8e3dd10ba_1190x665.png 424w, https://substackcdn.com/image/fetch/$s_!UFcy!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9a09e2eb-cd0e-4f99-b016-c6c8e3dd10ba_1190x665.png 848w, 
https://substackcdn.com/image/fetch/$s_!UFcy!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9a09e2eb-cd0e-4f99-b016-c6c8e3dd10ba_1190x665.png 1272w, https://substackcdn.com/image/fetch/$s_!UFcy!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9a09e2eb-cd0e-4f99-b016-c6c8e3dd10ba_1190x665.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!UFcy!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9a09e2eb-cd0e-4f99-b016-c6c8e3dd10ba_1190x665.png" width="1190" height="665" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/9a09e2eb-cd0e-4f99-b016-c6c8e3dd10ba_1190x665.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:665,&quot;width&quot;:1190,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1202184,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9a09e2eb-cd0e-4f99-b016-c6c8e3dd10ba_1190x665.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!UFcy!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9a09e2eb-cd0e-4f99-b016-c6c8e3dd10ba_1190x665.png 424w, 
https://substackcdn.com/image/fetch/$s_!UFcy!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9a09e2eb-cd0e-4f99-b016-c6c8e3dd10ba_1190x665.png 848w, https://substackcdn.com/image/fetch/$s_!UFcy!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9a09e2eb-cd0e-4f99-b016-c6c8e3dd10ba_1190x665.png 1272w, https://substackcdn.com/image/fetch/$s_!UFcy!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9a09e2eb-cd0e-4f99-b016-c6c8e3dd10ba_1190x665.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>There are broadly three types of users to consider.</p><p>Novice users have the following failure modes.</p><p>Too aggressive with keywords &#8212; ANDing too many specific terms, getting zero results. LLM-to-Boolean might help here by adding synonyms, though in my experience this doesn&#8217;t help because the user&#8217;s search is often simply too strict.</p><p>Too broad a query &#8212; a single or too general term, overwhelmed by thousands of results. LLM-to-Boolean may actually make this worse by adding synonyms that broaden the set further. What this user needs is better ranking, not more synonyms.</p><p>Natural language as query &#8212; users thinking they are working with a natural language search system and typing a full question, getting zero or bizarre results because the system matches &#8220;what,&#8221; &#8220;is,&#8221; &#8220;the&#8221; literally. LLM-to-Boolean helps here by parsing the question into workable Boolean.</p><p>For the increasing number of users who expect natural language search and get zero results because the system cannot parse their sentence, LLM-to-Boolean is a genuine improvement over nothing. But this is a relatively narrow use case: even without it, many users quickly adjust and switch to keywords when they notice zero results.</p><p>Expert searchers who construct systematic review search strategies. These users gain nothing. They build lengthy, carefully piloted Boolean strategies using controlled vocabulary and proximity operators. As of 2026, LLM-based Boolean generation is still not reliable enough to replace expert searchers, although recent benchmark work &#8212; notably the <a href="https://arxiv.org/pdf/2602.00005">AutoBool project using reinforcement learning</a> &#8212; has narrowed the gap on some datasets. LLMs can be useful for brainstorming, but they cannot serve as an automated replacement. 
Expert searchers are not going to benefit from an LLM doing what they already do, and doing it less reliably<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-4" href="#footnote-4" target="_self">4</a>.</p><p>Users who type in reasonably simple keywords. This is the largest group and the one that matters most &#8212; researchers looking for relevant literature, students doing coursework, information literacy librarians conducting narrative reviews. </p><p>This group either types in 3-5 reasonable keywords or constructs simpler versions of the nested Boolean (A OR B) AND (C OR D) strategies used by systematic review searchers.</p><p>Many of these users do not have a retrieval problem: their keywords already retrieve relevant documents. They have a ranking problem. The relevant documents are in the result set but buried beneath less relevant ones. What they need is not a fancier query; they need the search engine to put the best results at the top. LLM-to-Boolean does nothing about this &#8212; and, as I will argue, can actually make things worse.</p><h2>The synonym expansion problem</h2><p>To understand how LLM-to-Boolean can degrade results for that third group, we need to look at what it actually does to a query.</p><p>When an LLM converts a natural language query to Boolean, it almost always adds a large number of synonyms. Strip away the marketing language and what the LLM is doing &#8212; beyond dropping stop words and extracting key concepts &#8212; is essentially query expansion: transforming a user&#8217;s simple keywords into nested Boolean strings with multiple OR&#8217;d synonyms per concept<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-5" href="#footnote-5" target="_self">5</a>.</p><p>Query expansion is not new<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-6" href="#footnote-6" target="_self">6</a>. 
It can improve recall by retrieving more potentially relevant documents. But it also injects noise by retrieving many more marginal or incidental matches. Whether that trade-off is worthwhile depends entirely on whether the synonyms added fit the searcher&#8217;s intent exactly and whether the search system has a strong enough ranking layer to separate signal from noise.</p><p>In the next section, I provide three separate arguments for why LLMs generating Boolean from query inputs do not necessarily improve things.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!aMOY!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F38f62876-f9c6-49c4-8844-9d992f3dd389_776x433.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!aMOY!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F38f62876-f9c6-49c4-8844-9d992f3dd389_776x433.png 424w, https://substackcdn.com/image/fetch/$s_!aMOY!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F38f62876-f9c6-49c4-8844-9d992f3dd389_776x433.png 848w, https://substackcdn.com/image/fetch/$s_!aMOY!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F38f62876-f9c6-49c4-8844-9d992f3dd389_776x433.png 1272w, https://substackcdn.com/image/fetch/$s_!aMOY!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F38f62876-f9c6-49c4-8844-9d992f3dd389_776x433.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!aMOY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F38f62876-f9c6-49c4-8844-9d992f3dd389_776x433.png" width="776" height="433" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/38f62876-f9c6-49c4-8844-9d992f3dd389_776x433.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:433,&quot;width&quot;:776,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:657631,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F38f62876-f9c6-49c4-8844-9d992f3dd389_776x433.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!aMOY!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F38f62876-f9c6-49c4-8844-9d992f3dd389_776x433.png 424w, https://substackcdn.com/image/fetch/$s_!aMOY!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F38f62876-f9c6-49c4-8844-9d992f3dd389_776x433.png 848w, https://substackcdn.com/image/fetch/$s_!aMOY!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F38f62876-f9c6-49c4-8844-9d992f3dd389_776x433.png 1272w, https://substackcdn.com/image/fetch/$s_!aMOY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F38f62876-f9c6-49c4-8844-9d992f3dd389_776x433.png 1456w" sizes="100vw" 
loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h3>Argument 1 : Nested Boolean is a search paradigm that is no longer useful in today&#8217;s search environment</h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!HOMb!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fba38cc6e-7871-420e-9465-dc4c2508ba25_2816x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" 
srcset="https://substackcdn.com/image/fetch/$s_!HOMb!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fba38cc6e-7871-420e-9465-dc4c2508ba25_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!HOMb!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fba38cc6e-7871-420e-9465-dc4c2508ba25_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!HOMb!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fba38cc6e-7871-420e-9465-dc4c2508ba25_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!HOMb!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fba38cc6e-7871-420e-9465-dc4c2508ba25_2816x1536.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!HOMb!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fba38cc6e-7871-420e-9465-dc4c2508ba25_2816x1536.png" width="1456" height="794" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ba38cc6e-7871-420e-9465-dc4c2508ba25_2816x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:794,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:8874657,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fba38cc6e-7871-420e-9465-dc4c2508ba25_2816x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" 
class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!HOMb!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fba38cc6e-7871-420e-9465-dc4c2508ba25_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!HOMb!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fba38cc6e-7871-420e-9465-dc4c2508ba25_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!HOMb!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fba38cc6e-7871-420e-9465-dc4c2508ba25_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!HOMb!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fba38cc6e-7871-420e-9465-dc4c2508ba25_2816x1536.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" 
stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><a href="https://musingsaboutlibrarianship.blogspot.com/2014/07/why-nested-boolean-search-statements.html">I argued as early as 2014, well before the emergence of LLMs, that nested Boolean searching had become far less effective in many modern search environments and use cases (outside of evidence synthesis).</a> The traditional nested Boolean strategy, decomposing a topic into concepts, enumerating synonyms for each, and combining them in the form <code>(A1 OR A2 OR A3) AND (B1 OR B2 OR B3)</code>, was developed for a very different retrieval context: one characterised by limited full-text coverage, relatively small databases, and a significant risk of zero results. Under those conditions, extensive synonym expansion was often both rational and necessary.</p><p>Contemporary search environments differ markedly. Full-text indexing is now widespread, collections routinely contain hundreds of millions of records, and stemming or related linguistic normalisation techniques handle many lexical variants automatically. In such contexts, straightforward keyword searches already tend to achieve acceptable recall and the focus is on precision. Adding long lists of OR-connected terms therefore often produces an explosion of incidental matches. A monograph that mentions &#8220;cardiac event&#8221; once in passing on page 247 may enter the result set alongside a systematic review centrally concerned with the topic<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-7" href="#footnote-7" target="_self">7</a>. 
Even in systems without full-text search, the average query now tends to retrieve far more material than in the past, which strengthens the case for improved ranking rather than more aggressive expansion.</p><h3>Argument 2 : LLMs today add poor synonyms that create more noise and over-stress outdated relevance ranking systems</h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!vfMq!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23b3dff1-bdc1-4afc-8978-bea831ddc0c1_2816x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!vfMq!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23b3dff1-bdc1-4afc-8978-bea831ddc0c1_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!vfMq!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23b3dff1-bdc1-4afc-8978-bea831ddc0c1_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!vfMq!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23b3dff1-bdc1-4afc-8978-bea831ddc0c1_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!vfMq!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23b3dff1-bdc1-4afc-8978-bea831ddc0c1_2816x1536.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!vfMq!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23b3dff1-bdc1-4afc-8978-bea831ddc0c1_2816x1536.png" width="1456" height="794" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/23b3dff1-bdc1-4afc-8978-bea831ddc0c1_2816x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:794,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:8521797,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23b3dff1-bdc1-4afc-8978-bea831ddc0c1_2816x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!vfMq!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23b3dff1-bdc1-4afc-8978-bea831ddc0c1_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!vfMq!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23b3dff1-bdc1-4afc-8978-bea831ddc0c1_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!vfMq!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23b3dff1-bdc1-4afc-8978-bea831ddc0c1_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!vfMq!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23b3dff1-bdc1-4afc-8978-bea831ddc0c1_2816x1536.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>LLM-to-Boolean systems amplify this longstanding problem. Worse still, inspection of Boolean strings generated by current systems, especially those relying on lower-cost bundled models such as GPT-4o mini in products such as Primo Research Assistant, suggests that the generated synonyms are often of uneven quality. They may include loosely related terms, overly broad variants, or, in some cases, plainly inappropriate substitutions. Each additional weak term expands the candidate set while simultaneously increasing the proportion of noise within it.</p><p>The central mechanism is straightforward. 
Query expansion may assist strict Boolean retrieval by increasing the number of documents admitted into the result set, but it can also impair relevance ranking under models such as TF-IDF and BM25 by diluting the discriminative value of the user&#8217;s original terms. Once a query is expanded from a small number of strong keywords into multiple concepts populated by weaker synonyms, the ranking function may assign undue weight to documents matching several marginal variants. As a result, documents that align only loosely with the user&#8217;s actual intent may be ranked above those that match it more precisely. Because many library discovery systems combine Boolean retrieval with TF-IDF or BM25-style ranking, LLM-generated synonym expansion can improve one stage of the retrieval process, at least in the narrow sense of increasing potential recall, while simultaneously degrading another. In the absence of a sufficiently strong reranking layer, the result is not simply a larger result set, but a larger and less coherent one.</p><h3>Argument 3 : There are search-resistant concepts that are better NOT represented in the Boolean search</h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!6zve!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2c3d85-e92f-4190-90ce-2fd5e61f7927_2816x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!6zve!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2c3d85-e92f-4190-90ce-2fd5e61f7927_2816x1536.png 424w, 
https://substackcdn.com/image/fetch/$s_!6zve!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2c3d85-e92f-4190-90ce-2fd5e61f7927_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!6zve!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2c3d85-e92f-4190-90ce-2fd5e61f7927_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!6zve!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2c3d85-e92f-4190-90ce-2fd5e61f7927_2816x1536.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!6zve!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2c3d85-e92f-4190-90ce-2fd5e61f7927_2816x1536.png" width="1456" height="794" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/bf2c3d85-e92f-4190-90ce-2fd5e61f7927_2816x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:794,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:8657273,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2c3d85-e92f-4190-90ce-2fd5e61f7927_2816x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!6zve!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2c3d85-e92f-4190-90ce-2fd5e61f7927_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!6zve!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2c3d85-e92f-4190-90ce-2fd5e61f7927_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!6zve!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2c3d85-e92f-4190-90ce-2fd5e61f7927_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!6zve!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2c3d85-e92f-4190-90ce-2fd5e61f7927_2816x1536.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" 
stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>There is also a further complication. Sometimes, somewhat counter-intuitively, trying to represent hard-to-search concepts, what <a href="https://farhadinfo.medium.com/stop-searching-and-you-will-find-it-search-resistant-concepts-in-systematic-searching-c7968ddf22c8">Farhad Shokraneh calls </a><em><a href="https://farhadinfo.medium.com/stop-searching-and-you-will-find-it-search-resistant-concepts-in-systematic-searching-c7968ddf22c8">search-resistant concepts</a></em>, is a mistake. The reason is simple: if you do not know the right terms, forcing them into the query can exclude many relevant papers. In some cases, trying to be more precise actually makes the search worse. A good example is PICO-based searching. Outcome terms are often expressed in highly variable, non-standardised ways, so it is often better not to filter for outcomes at all, and instead accept a larger set for later screening. Do LLMs that expand searches recognise this distinction? </p><p>While evidence synthesis librarians are more willing to look through 100% of a much bigger result set, most other users will not look through every result, and here again a much stronger ranker is where most of the value of &#8220;AI search&#8221; lies.</p><h2>PubMed: what good query expansion looks like</h2><p>Compare LLM-generated synonyms to a system that does query expansion well: PubMed. 
PubMed&#8217;s Automatic Term Mapping (ATM) also expands user queries with additional terms, but the quality difference is vast<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-8" href="#footnote-8" target="_self">8</a>.</p><p>Among other things, ATM maps user terms to MeSH (Medical Subject Headings) &#8212; a carefully curated, hierarchically structured controlled vocabulary maintained by domain experts over decades. When ATM expands "heart attack" to include "myocardial infarction," it draws on a tested thesaurus. When an LLM expands "heart attack" to include "cardiac event," "chest pain," and "cardiovascular incident," it generates plausible-sounding terms with no guarantee they map to the same concept.</p><p>PubMed also has architectural advantages. Its users often prioritise recall over precision, making aggressive expansion a more defensible trade-off. It searches citation and abstract records plus MeSH metadata but not full text, making every keyword match less likely to be incidental. 
It covers a well-defined domain (life sciences), reducing the risk that added terms have multiple unrelated meanings.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!FLTu!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F08db5dd8-f23d-4a11-81c3-39705182bd81_757x429.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!FLTu!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F08db5dd8-f23d-4a11-81c3-39705182bd81_757x429.png 424w, https://substackcdn.com/image/fetch/$s_!FLTu!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F08db5dd8-f23d-4a11-81c3-39705182bd81_757x429.png 848w, https://substackcdn.com/image/fetch/$s_!FLTu!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F08db5dd8-f23d-4a11-81c3-39705182bd81_757x429.png 1272w, https://substackcdn.com/image/fetch/$s_!FLTu!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F08db5dd8-f23d-4a11-81c3-39705182bd81_757x429.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!FLTu!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F08db5dd8-f23d-4a11-81c3-39705182bd81_757x429.png" width="757" height="429" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/08db5dd8-f23d-4a11-81c3-39705182bd81_757x429.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:429,&quot;width&quot;:757,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:491853,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F08db5dd8-f23d-4a11-81c3-39705182bd81_757x429.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!FLTu!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F08db5dd8-f23d-4a11-81c3-39705182bd81_757x429.png 424w, https://substackcdn.com/image/fetch/$s_!FLTu!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F08db5dd8-f23d-4a11-81c3-39705182bd81_757x429.png 848w, https://substackcdn.com/image/fetch/$s_!FLTu!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F08db5dd8-f23d-4a11-81c3-39705182bd81_757x429.png 1272w, https://substackcdn.com/image/fetch/$s_!FLTu!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F08db5dd8-f23d-4a11-81c3-39705182bd81_757x429.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Most critically, PubMed has a superior ranking system. It uses a two-stage architecture with LambdaMART reranking on the top 500 results &#8212; far more sophisticated than generic BM25. So even when ATM broadens the result set, the reranking step ensures the most relevant documents rise to the top. The expansion and the reranking work together as a system. This is precisely the architecture most library database searches lack.</p><h2>What does the empirical evidence say?</h2><p>Among the systems which use an LLM to convert input to Boolean, Primo Research Assistant is probably the most well studied. </p><p>One of the more rigorous studies is Galbreath et al. 
(2025), which evaluated Ex Libris&#8217; Primo Research Assistant (PRA), which at the time of study was using GPT-3.5 to convert natural language into Boolean &#8212; against Boolean searches crafted by instruction librarians at Washington State University.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!u2V0!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab051f92-c79f-4b64-9537-7866e3def120_1205x667.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!u2V0!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab051f92-c79f-4b64-9537-7866e3def120_1205x667.png 424w, https://substackcdn.com/image/fetch/$s_!u2V0!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab051f92-c79f-4b64-9537-7866e3def120_1205x667.png 848w, https://substackcdn.com/image/fetch/$s_!u2V0!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab051f92-c79f-4b64-9537-7866e3def120_1205x667.png 1272w, https://substackcdn.com/image/fetch/$s_!u2V0!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab051f92-c79f-4b64-9537-7866e3def120_1205x667.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!u2V0!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab051f92-c79f-4b64-9537-7866e3def120_1205x667.png" width="1205" height="667" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ab051f92-c79f-4b64-9537-7866e3def120_1205x667.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:667,&quot;width&quot;:1205,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1097919,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab051f92-c79f-4b64-9537-7866e3def120_1205x667.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!u2V0!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab051f92-c79f-4b64-9537-7866e3def120_1205x667.png 424w, https://substackcdn.com/image/fetch/$s_!u2V0!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab051f92-c79f-4b64-9537-7866e3def120_1205x667.png 848w, https://substackcdn.com/image/fetch/$s_!u2V0!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab051f92-c79f-4b64-9537-7866e3def120_1205x667.png 1272w, https://substackcdn.com/image/fetch/$s_!u2V0!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab051f92-c79f-4b64-9537-7866e3def120_1205x667.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>The headline finding: no appreciable difference in topical relevance. PRA returned relevant sources 46.3 per cent of the time; librarian-built searches returned 45.6 per cent. I was mildly surprised at first at the results. But this result needs careful reading.</p><p>For each query, Primo Research Assistant generates ten Boolean variant strings and runs the search; the top five results are then sent to the LLM for summary generation.</p><p>Because Primo Research Assistant only generates answers using retrieval augmented generation based on the top 5 ranked results, it is critical that the relevant results make it to the top 5, which requires a very strong relevance ranking system.</p><p>Perhaps this is why PRA does more than pure LLM-to-Boolean: it adds an additional reranking step beyond the usual Primo relevance ranking. 
<em>It retrieves the top thirty matching records using the usual method and then reranks them using vector embeddings (semantic ranking).</em></p><p>Even though reranking the top 30 is still a relatively modest effort (many state-of-the-art systems will rerank the top 100!), and the semantic reranking will still fail if the conventional ranking fails to get relevant results in the top 30, it still helps a lot.</p><p>You can actually roughly compare what results in the top 5 would look like without the reranking steps<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-9" href="#footnote-9" target="_self">9</a>. I have done some comparisons and while I am not the most impressed with Primo Research Assistant&#8217;s relevancy ranking even with the reranking step, the results would be far worse without it!</p><p>The other issue is the sample of queries used. The study used zero-result patron queries &#8212; queries where users had typed natural language into Primo and received nothing back. These are precisely the cases where LLM-to-Boolean provides the clearest benefit. The results might look very different for the much larger population of queries that already return results.</p><p>More importantly, I have a strong suspicion that the queries tested were mostly &#8220;easy&#8221; queries with many potential relevant matches. This is most telling with the lack of overlap in results between the items retrieved from librarian searches and PRA searches. </p><p>Despite both sets achieving roughly 50% precision<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-10" href="#footnote-10" target="_self">10</a>, only 7.21 per cent of PRA's citations matched the expert searches' results. 
Clearly, there were many relevant results and PRA was not finding better results; it was finding different results of comparable quality.</p><p>In short, the queries were not &#8220;skill-testing&#8221;; harder queries with a much smaller and limited set of relevant results would no doubt stress Primo Research Assistant even more, and this is where I see systems with more powerful relevancy ranking capabilities that go beyond simple lexical ranking &#8212; like Elicit.com, Undermind.ai and Consensus &#8212; shine.</p><h2>Not all LLM-to-Boolean tools are equal</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!aBrp!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72dd5019-3ddc-4c55-96b9-4431ad2a443b_3504x1184.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!aBrp!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72dd5019-3ddc-4c55-96b9-4431ad2a443b_3504x1184.png 424w, https://substackcdn.com/image/fetch/$s_!aBrp!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72dd5019-3ddc-4c55-96b9-4431ad2a443b_3504x1184.png 848w, https://substackcdn.com/image/fetch/$s_!aBrp!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72dd5019-3ddc-4c55-96b9-4431ad2a443b_3504x1184.png 1272w, https://substackcdn.com/image/fetch/$s_!aBrp!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72dd5019-3ddc-4c55-96b9-4431ad2a443b_3504x1184.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!aBrp!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72dd5019-3ddc-4c55-96b9-4431ad2a443b_3504x1184.png" width="1456" height="492" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/72dd5019-3ddc-4c55-96b9-4431ad2a443b_3504x1184.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:492,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:4928048,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72dd5019-3ddc-4c55-96b9-4431ad2a443b_3504x1184.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!aBrp!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72dd5019-3ddc-4c55-96b9-4431ad2a443b_3504x1184.png 424w, https://substackcdn.com/image/fetch/$s_!aBrp!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72dd5019-3ddc-4c55-96b9-4431ad2a443b_3504x1184.png 848w, https://substackcdn.com/image/fetch/$s_!aBrp!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72dd5019-3ddc-4c55-96b9-4431ad2a443b_3504x1184.png 1272w, https://substackcdn.com/image/fetch/$s_!aBrp!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72dd5019-3ddc-4c55-96b9-4431ad2a443b_3504x1184.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The tools I listed at the outset sit on a spectrum, and the differences matter.</p><p>At one end, Web of Science Research Assistant (as tested in early 2025) and EBSCOhost NLS are pure LLM-to-Boolean: they generate a Boolean query and run it against the standard index with no changes to ranking. The homebrew implementations from Stony Brook and San Diego State work similarly<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-11" href="#footnote-11" target="_self">11</a>. 
</p><p>In the middle, as we have seen - Primo Research Assistant generates Boolean, retrieves the top 30 results, then reranks them using embeddings. Web of Science Smart Search runs Boolean and semantic search together and lets users toggle between combined, Boolean-only, and semantic-only results. (Do not confuse Web of Science Smart Search with Web of Science Research Assistant &#8212; the former is bundled with no RAG; the latter is a paid add-on with RAG.)</p><p>At the other end, Scopus AI describes a hybrid architecture in which it may use vector search, keyword search, or both depending on the query, combining and reranking the results.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!atRx!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!atRx!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 424w, https://substackcdn.com/image/fetch/$s_!atRx!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 848w, https://substackcdn.com/image/fetch/$s_!atRx!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 1272w, https://substackcdn.com/image/fetch/$s_!atRx!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 1456w" 
sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!atRx!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png" width="1125" height="346" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/bd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:346,&quot;width&quot;:1125,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!atRx!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 424w, https://substackcdn.com/image/fetch/$s_!atRx!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 848w, https://substackcdn.com/image/fetch/$s_!atRx!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 1272w, https://substackcdn.com/image/fetch/$s_!atRx!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft 
pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Once you lay out this spectrum, you can make a prediction: tools that go beyond LLM-to-Boolean alone &#8212; those adding hybrid search, dense embedding reranking &#8212; should typically outperform those that do not and be favoured by serious researchers. And roughly speaking, this is what I found in my informal comparative testing and<a href="https://katinamagazine.org/search?option1=fulltext&amp;value1=%22aaron+tay%22"> in various Katina reviews.</a></p><blockquote><p>So far, we have been discussing &#8220;quick search&#8221;, where results are returned with very little delay (e.g. &lt; 1 min). Agentic/deep search, which uses LLMs to do iterative searching and evaluation, gives you much superior results, but you will have to wait much longer (e.g. 
&gt;10 minutes) for the results. I dub this the difference between <a href="https://aarontay.substack.com/p/why-i-think-academic-deep-research">Deep Search/Research tools vs &#8220;Quick Search&#8221;.</a></p></blockquote><p><a href="https://aarontay.substack.com/p/the-reproducibility-and">The LLM-to-Boolean approach does have one genuine strength: interpretability. </a>When the system displays the generated Boolean, you can inspect it, critique it, modify it, and rerun it. That transparency in the retrieval stage is worth acknowledging. But it comes at the cost of reproducibility: because an LLM generates the query, the search strategy can change each time you run it.<a href="https://katinamagazine.org/content/article/reviews/2025/deep-dive-into-three-ai-academic-search-tools"> In my testing, Web of Science Research Assistant and Primo Research Assistant generated different Boolean strings roughly one in five times; Scopus AI changed nearly every other time.</a></p><h2>Why our profession's focus on Boolean retrieval is understandable but limiting</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!rSbM!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdad26933-5ec4-4f2c-86a0-f417454ccbdd_2816x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!rSbM!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdad26933-5ec4-4f2c-86a0-f417454ccbdd_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!rSbM!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdad26933-5ec4-4f2c-86a0-f417454ccbdd_2816x1536.png 848w, 
https://substackcdn.com/image/fetch/$s_!rSbM!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdad26933-5ec4-4f2c-86a0-f417454ccbdd_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!rSbM!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdad26933-5ec4-4f2c-86a0-f417454ccbdd_2816x1536.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!rSbM!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdad26933-5ec4-4f2c-86a0-f417454ccbdd_2816x1536.png" width="1456" height="794" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/dad26933-5ec4-4f2c-86a0-f417454ccbdd_2816x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:794,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:8671563,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdad26933-5ec4-4f2c-86a0-f417454ccbdd_2816x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!rSbM!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdad26933-5ec4-4f2c-86a0-f417454ccbdd_2816x1536.png 424w, 
https://substackcdn.com/image/fetch/$s_!rSbM!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdad26933-5ec4-4f2c-86a0-f417454ccbdd_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!rSbM!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdad26933-5ec4-4f2c-86a0-f417454ccbdd_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!rSbM!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdad26933-5ec4-4f2c-86a0-f417454ccbdd_2816x1536.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" 
y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>Library training and practice have always centred on the retrieval side of search &#8212; constructing the right query to get the right documents into the result set. That is what we teach, what we are trained in, and where our expertise lies. Ranking &#8212; what happens after retrieval &#8212; has historically been the vendor&#8217;s domain, largely invisible to us and outside our direct control.</p><p>This is not a failing of individual librarians. It is a structural feature of how the profession developed. When library catalogues used strict Boolean with no relevance ranking at all &#8212; results sorted by accession number or date &#8212; retrieval was genuinely the whole game. Getting documents into the result set was the only thing you could influence. Evidence Synthesis Librarians obviously have the same mindset as they typically intend to screen all the retrieved results. The habits, pedagogy, and professional identity that developed around this reality are deeply embedded and entirely rational given that history.</p><p>But the search environment has changed. Users now routinely face thousands of results and scan only the first few pages. In that context, ranking determines what users actually encounter. The professional focus on retrieval, while understandable, has become a blind spot &#8212; and it shapes which AI innovations we notice and which we overlook.</p><p>LLM-to-Boolean is visible, inspectable, and maps directly onto existing expertise. It fits neatly into teaching practices and workflows. It is unsurprising that it has generated more enthusiasm than semantic reranking, which operates invisibly beneath the interface. But we need to be honest that familiarity is not the same as effectiveness. 
Our experience with Google and Google Scholar teaches us that users overwhelmingly judge search engines by the quality of what appears on the first page, not by whether they can inspect the query logic. A search you can fully explain but that returns mediocre results will be rejected in favour of one that is harder to explain but returns excellent results.</p><p>To be fair, since I started in the profession in 2007, I have seen a lesser focus on teaching Boolean by librarians, but the rise of &#8220;AI search&#8221; may accidentally push this back onto the agenda&#8230;</p><h2>Vendors have their own motivation to create the narrative LLM to Boolean = AI search</h2><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Azm3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdcc9891e-eef9-41de-96d4-27db1ef51d33_2816x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Azm3!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdcc9891e-eef9-41de-96d4-27db1ef51d33_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!Azm3!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdcc9891e-eef9-41de-96d4-27db1ef51d33_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!Azm3!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdcc9891e-eef9-41de-96d4-27db1ef51d33_2816x1536.png 1272w, 
https://substackcdn.com/image/fetch/$s_!Azm3!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdcc9891e-eef9-41de-96d4-27db1ef51d33_2816x1536.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Azm3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdcc9891e-eef9-41de-96d4-27db1ef51d33_2816x1536.png" width="1456" height="794" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/dcc9891e-eef9-41de-96d4-27db1ef51d33_2816x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:794,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:9296100,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdcc9891e-eef9-41de-96d4-27db1ef51d33_2816x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Azm3!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdcc9891e-eef9-41de-96d4-27db1ef51d33_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!Azm3!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdcc9891e-eef9-41de-96d4-27db1ef51d33_2816x1536.png 848w, 
https://substackcdn.com/image/fetch/$s_!Azm3!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdcc9891e-eef9-41de-96d4-27db1ef51d33_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!Azm3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdcc9891e-eef9-41de-96d4-27db1ef51d33_2816x1536.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Existing database vendors, for their part, have their own reasons for staying with lexical methods and they have to do with cost. 
Boolean retrieval over inverted indexes is fast, well understood, and already built. The infrastructure exists and is paid for. Bolting an LLM onto the front end to generate Boolean queries requires no changes to the underlying index, no new data pipelines, and no reindexing of billions of records. It is, from an engineering and business perspective, the cheapest possible way to say you are doing "AI", especially if you bolt on the cheapest LLM you can find<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-12" href="#footnote-12" target="_self">12</a>.</p><p>Moving to dense embeddings is a different proposition entirely. It requires generating vector representations for every document in the index<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-13" href="#footnote-13" target="_self">13</a>. At the scale of a system like Ex Libris CDI, with over five billion records, that is a significant computational investment &#8212; not just a one-off cost but an ongoing one, since embeddings need to be regenerated whenever the model is updated or new documents are ingested. Dense retrieval is also slower than inverted index lookup at query time, particularly without heavy optimisation of approximate nearest neighbour search infrastructure.  </p><p>Cross-encoder reranking or using LLMs directly for ranking, the most powerful option for second-stage ranking, is more expensive still. A cross-encoder scores each query-document pair individually, which means running the model once for every candidate document. Even reranking just the top 500 results per query, at the scale of millions of daily searches, adds up. 
Vendors looking at these numbers can easily conclude that the return on investment is uncertain &#8212; especially when librarians are not asking for it and seem satisfied with LLM-to-Boolean.</p><blockquote><p>The next level beyond these methods would be employing agentic/deep search, which uses the LLMs to do iterative searching and evaluation -  you get much superior results but at the cost of latency<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-14" href="#footnote-14" target="_self">14</a>.</p></blockquote><p>This creates a reinforcing cycle. Librarians ask for LLM to Boolean retrieval because that is where their expertise lies. Legacy Vendors invest in LLM-to-Boolean because it is cheap to implement and aligns with what librarians are asking for. Neither side pushes for the harder, more expensive, but ultimately more impactful investment in ranking. The result is that library search systems remain stuck with decades-old ranking technology while vendors market a superficial AI layer on top as though it were transformative.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!h4jP!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf4b5bff-4a42-4d36-9374-4c90f2b642ba_2816x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!h4jP!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf4b5bff-4a42-4d36-9374-4c90f2b642ba_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!h4jP!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf4b5bff-4a42-4d36-9374-4c90f2b642ba_2816x1536.png 848w, 
https://substackcdn.com/image/fetch/$s_!h4jP!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf4b5bff-4a42-4d36-9374-4c90f2b642ba_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!h4jP!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf4b5bff-4a42-4d36-9374-4c90f2b642ba_2816x1536.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!h4jP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf4b5bff-4a42-4d36-9374-4c90f2b642ba_2816x1536.png" width="1456" height="794" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/df4b5bff-4a42-4d36-9374-4c90f2b642ba_2816x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:794,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:8529371,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf4b5bff-4a42-4d36-9374-4c90f2b642ba_2816x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!h4jP!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf4b5bff-4a42-4d36-9374-4c90f2b642ba_2816x1536.png 424w, 
https://substackcdn.com/image/fetch/$s_!h4jP!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf4b5bff-4a42-4d36-9374-4c90f2b642ba_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!h4jP!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf4b5bff-4a42-4d36-9374-4c90f2b642ba_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!h4jP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf4b5bff-4a42-4d36-9374-4c90f2b642ba_2816x1536.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" 
y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p></p><h2>What should AI search do?</h2><p>Let me suggest two approaches</p><h3>1. The more conservative approach to maintain interpretability</h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Mkfx!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe77aadbf-44a1-422e-909b-cffd4ec72031_1190x667.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Mkfx!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe77aadbf-44a1-422e-909b-cffd4ec72031_1190x667.png 424w, https://substackcdn.com/image/fetch/$s_!Mkfx!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe77aadbf-44a1-422e-909b-cffd4ec72031_1190x667.png 848w, https://substackcdn.com/image/fetch/$s_!Mkfx!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe77aadbf-44a1-422e-909b-cffd4ec72031_1190x667.png 1272w, https://substackcdn.com/image/fetch/$s_!Mkfx!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe77aadbf-44a1-422e-909b-cffd4ec72031_1190x667.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Mkfx!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe77aadbf-44a1-422e-909b-cffd4ec72031_1190x667.png" width="1190" height="667" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/e77aadbf-44a1-422e-909b-cffd4ec72031_1190x667.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:667,&quot;width&quot;:1190,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1146637,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe77aadbf-44a1-422e-909b-cffd4ec72031_1190x667.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Mkfx!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe77aadbf-44a1-422e-909b-cffd4ec72031_1190x667.png 424w, https://substackcdn.com/image/fetch/$s_!Mkfx!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe77aadbf-44a1-422e-909b-cffd4ec72031_1190x667.png 848w, https://substackcdn.com/image/fetch/$s_!Mkfx!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe77aadbf-44a1-422e-909b-cffd4ec72031_1190x667.png 1272w, https://substackcdn.com/image/fetch/$s_!Mkfx!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe77aadbf-44a1-422e-909b-cffd4ec72031_1190x667.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p><strong>Keep Boolean retrieval for the first stage.</strong> Inverted indexes and Boolean logic remain the right tool for scalable initial retrieval. There is no need to abandon this.</p><p>Add modern reranking as a second stage. After Boolean retrieval and BM25 produce a candidate set, apply a &#8220;neural&#8221; reranker &#8212; whether a bi-encoder, cross-encoder, or LLM-based ranker &#8212; to re-sort those candidates before presenting results. This is not radical. <a href="https://arxiv.org/abs/2301.10140">Semantic Scholar uses LightGBM reranking that emphasises title matches and highly-cited recent papers.</a> <a href="https://pmc.ncbi.nlm.nih.gov/articles/PMC6112631/">PubMed uses LambdaMART on the top 500 results. 
</a>Both are academic search engines at massive scale, and both concluded that BM25 alone was insufficient. Even these comparatively modest reranking techniques, now almost a generation behind the state of the art, produce noticeably better results than BM25 for ranking.</p><p>Some librarians may object that these new, usually neural, reranking methods are not as interpretable as lexical relevance ranking based on matching query terms. This concern is overblown, for a simple reason: the current system is not that interpretable either<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-15" href="#footnote-15" target="_self">15</a>. </p><p><a href="https://knowledge.exlibrisgroup.com/Primo/Content_Corner/Central_Discovery_Index/Documentation_and_Training/Documentation_and_Training_(English)/CDI_-_The_Central_Discovery_Index/080Search_and_Ranking_in_CDI">The Ex Libris &#8220;Search and Ranking in CDI&#8221; </a>documentation describes a relevance algorithm built on a &#8220;continuously tuned, proprietary&#8221; mix of dynamic rank factors, static rank factors, field boosting, personalised ranking by discipline, and various other components. I would wager that very few librarians who use Primo could explain in detail how CDI&#8217;s current ranking works. We have already accepted opaque ranking (think Google since 2000) &#8212; we just have not acknowledged it<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-16" href="#footnote-16" target="_self">16</a>.</p><p><strong>In return, with Boolean still as a first stage retriever, you get exact hit counts and <a href="https://aarontay.substack.com/p/the-case-of-the-vanishing-hit-count">don&#8217;t run into the problem of hit counts becoming approximate if you use semantic search methods as the first stage retriever.</a></strong></p><h3>2. 
Giving up interpretability for effectiveness</h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!BY3g!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5036bd52-27de-48cf-b7c8-d2993d2c3175_1194x672.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!BY3g!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5036bd52-27de-48cf-b7c8-d2993d2c3175_1194x672.png 424w, https://substackcdn.com/image/fetch/$s_!BY3g!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5036bd52-27de-48cf-b7c8-d2993d2c3175_1194x672.png 848w, https://substackcdn.com/image/fetch/$s_!BY3g!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5036bd52-27de-48cf-b7c8-d2993d2c3175_1194x672.png 1272w, https://substackcdn.com/image/fetch/$s_!BY3g!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5036bd52-27de-48cf-b7c8-d2993d2c3175_1194x672.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!BY3g!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5036bd52-27de-48cf-b7c8-d2993d2c3175_1194x672.png" width="1194" height="672" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/5036bd52-27de-48cf-b7c8-d2993d2c3175_1194x672.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:672,&quot;width&quot;:1194,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1395450,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5036bd52-27de-48cf-b7c8-d2993d2c3175_1194x672.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!BY3g!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5036bd52-27de-48cf-b7c8-d2993d2c3175_1194x672.png 424w, https://substackcdn.com/image/fetch/$s_!BY3g!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5036bd52-27de-48cf-b7c8-d2993d2c3175_1194x672.png 848w, https://substackcdn.com/image/fetch/$s_!BY3g!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5036bd52-27de-48cf-b7c8-d2993d2c3175_1194x672.png 1272w, https://substackcdn.com/image/fetch/$s_!BY3g!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5036bd52-27de-48cf-b7c8-d2993d2c3175_1194x672.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>There is a stronger version of the argument I have been making that I want to put on the table: perhaps we should stop treating Boolean as the obvious choice for first-stage retrieval at all.</p><p>Throughout this post I have advocated a two-stage architecture that keeps Boolean retrieval as the first stage and adds modern reranking as the second. That is a pragmatic position &#8212; it preserves what vendors and librarians are comfortable with while addressing the ranking bottleneck. But pragmatism can obscure a deeper problem. Boolean retrieval is not just outdated at the ranking stage. It is limiting at the retrieval stage too.</p><p>The fundamental issue is that Boolean is binary. A document either matches the query logic or it is excluded entirely. There is no middle ground. 
If a highly relevant paper uses none of your specified terms or synonyms &#8212; because the authors used different terminology, because the concept is expressed implicitly, or because the relevant discussion appears in a section your metadata fields do not cover &#8212; Boolean will never surface it. It does not matter how good your ranking is downstream. A document that never enters the candidate set cannot be ranked.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!KOBx!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9c278fd8-3c00-433a-b1c8-667c46887e8b_1196x664.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!KOBx!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9c278fd8-3c00-433a-b1c8-667c46887e8b_1196x664.png 424w, https://substackcdn.com/image/fetch/$s_!KOBx!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9c278fd8-3c00-433a-b1c8-667c46887e8b_1196x664.png 848w, https://substackcdn.com/image/fetch/$s_!KOBx!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9c278fd8-3c00-433a-b1c8-667c46887e8b_1196x664.png 1272w, https://substackcdn.com/image/fetch/$s_!KOBx!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9c278fd8-3c00-433a-b1c8-667c46887e8b_1196x664.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!KOBx!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9c278fd8-3c00-433a-b1c8-667c46887e8b_1196x664.png" width="1196" height="664" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/9c278fd8-3c00-433a-b1c8-667c46887e8b_1196x664.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:664,&quot;width&quot;:1196,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1024369,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9c278fd8-3c00-433a-b1c8-667c46887e8b_1196x664.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!KOBx!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9c278fd8-3c00-433a-b1c8-667c46887e8b_1196x664.png 424w, https://substackcdn.com/image/fetch/$s_!KOBx!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9c278fd8-3c00-433a-b1c8-667c46887e8b_1196x664.png 848w, https://substackcdn.com/image/fetch/$s_!KOBx!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9c278fd8-3c00-433a-b1c8-667c46887e8b_1196x664.png 1272w, https://substackcdn.com/image/fetch/$s_!KOBx!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9c278fd8-3c00-433a-b1c8-667c46887e8b_1196x664.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Having worked with researchers,<em> I can tell you even in areas they know well, they tend to struggle with overly including terms, leading them to put in keywords that end up excluding even known relevant gold standard papers they give me!</em></p><p>The reason for this is that most researchers and even librarians are unfamiliar with what <a href="https://farhadinfo.medium.com/stop-searching-and-you-will-find-it-search-resistant-concepts-in-systematic-searching-c7968ddf22c8">Farhad Shokraneh calls &#8220;search resistant concepts&#8221; which he defines as &#8220;concepts that when 
added to the search, are more likely to miss the relevant records.&#8221;</a> In such situations, if you want to ensure high recall, you should not even try to search for the concept!</p><p>He gives three reasons for why concepts are hard to search, but the lack of standardised terminology used by the field is the clearest reason.</p><p>In evidence synthesis scenarios, search resistant concepts typically are outcome concepts (from PICO) which are described in so many different ways, such that it is often better not to even try to search for them. Do LLMs know this?  </p><p>This is precisely why LLM-to-Boolean tools resort to aggressive synonym expansion in the first place. The rigidity of Boolean matching creates a constant risk of missing relevant documents, so the system compensates by throwing in every plausible variant. But as I have argued, that expansion then degrades BM25 ranking by flooding the result set with noise. The root cause of both problems &#8212; missed documents and noisy results &#8212; is the same: Boolean&#8217;s binary matching model.</p><p>BM25, used as a first-stage retriever rather than just a ranker, avoids this entirely. BM25 does not hard-exclude documents. It scores every document against the query and returns the top-k by relevance score. A document that matches some but not all of your terms still appears &#8212; it is just ranked lower. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!ofLA!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e3499cd-f45a-4e03-a41b-9cbec3b6e83c_1180x662.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!ofLA!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e3499cd-f45a-4e03-a41b-9cbec3b6e83c_1180x662.png 424w, https://substackcdn.com/image/fetch/$s_!ofLA!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e3499cd-f45a-4e03-a41b-9cbec3b6e83c_1180x662.png 848w, https://substackcdn.com/image/fetch/$s_!ofLA!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e3499cd-f45a-4e03-a41b-9cbec3b6e83c_1180x662.png 1272w, https://substackcdn.com/image/fetch/$s_!ofLA!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e3499cd-f45a-4e03-a41b-9cbec3b6e83c_1180x662.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!ofLA!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e3499cd-f45a-4e03-a41b-9cbec3b6e83c_1180x662.png" width="1180" height="662" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/7e3499cd-f45a-4e03-a41b-9cbec3b6e83c_1180x662.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:662,&quot;width&quot;:1180,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1369802,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e3499cd-f45a-4e03-a41b-9cbec3b6e83c_1180x662.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!ofLA!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e3499cd-f45a-4e03-a41b-9cbec3b6e83c_1180x662.png 424w, https://substackcdn.com/image/fetch/$s_!ofLA!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e3499cd-f45a-4e03-a41b-9cbec3b6e83c_1180x662.png 848w, https://substackcdn.com/image/fetch/$s_!ofLA!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e3499cd-f45a-4e03-a41b-9cbec3b6e83c_1180x662.png 1272w, https://substackcdn.com/image/fetch/$s_!ofLA!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7e3499cd-f45a-4e03-a41b-9cbec3b6e83c_1180x662.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>This means you do not need exhaustive synonym lists to compensate for rigid matching. A simple, well-chosen set of keywords will retrieve a broad and relevant candidate set because partial matches are included rather than discarded. 
</p><p></p><p> </p><blockquote><h3><strong>BM25 as first-stage retriever versus Boolean: what does this actually mean?</strong></h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!iAB6!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6f35a56-26e5-405d-bf59-f99f35ef9a75_2816x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!iAB6!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6f35a56-26e5-405d-bf59-f99f35ef9a75_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!iAB6!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6f35a56-26e5-405d-bf59-f99f35ef9a75_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!iAB6!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6f35a56-26e5-405d-bf59-f99f35ef9a75_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!iAB6!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6f35a56-26e5-405d-bf59-f99f35ef9a75_2816x1536.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!iAB6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6f35a56-26e5-405d-bf59-f99f35ef9a75_2816x1536.png" width="1456" height="794" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/d6f35a56-26e5-405d-bf59-f99f35ef9a75_2816x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:794,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:8251041,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6f35a56-26e5-405d-bf59-f99f35ef9a75_2816x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!iAB6!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6f35a56-26e5-405d-bf59-f99f35ef9a75_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!iAB6!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6f35a56-26e5-405d-bf59-f99f35ef9a75_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!iAB6!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6f35a56-26e5-405d-bf59-f99f35ef9a75_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!iAB6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6f35a56-26e5-405d-bf59-f99f35ef9a75_2816x1536.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Using BM25 as a first-stage retriever rather than Boolean can be hard to grasp if you are used to Boolean as the default, so here is a concrete example.</p><p>When you type <code>open access citation advantage</code> into a strict Boolean search engine, most systems today apply an implied AND. Every result must contain all four terms. If a document contains &#8220;open access&#8221; and &#8220;citation&#8221; but not &#8220;advantage,&#8221; it is excluded entirely &#8212; regardless of how relevant it might be.</p><p>A BM25-based retriever works differently. It scores every document based on how well it matches the query terms, weighing term frequency and rarity, but it does not hard-exclude documents that are missing a term. 
A system using BM25 for first-stage retrieval &#8212; as Google does, or Scite.ai &#8212; might return a document matching only three of your four terms if its overall relevance score is high enough<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-17" href="#footnote-17" target="_self">17</a>. The missing term potentially lowers the score vs documents with all four terms but does not eliminate the document from consideration<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-18" href="#footnote-18" target="_self">18</a>. </p><p>In the information retrieval world, this is still lexical/keyword-based as the retrieval and ranking are still just based on term matching<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-19" href="#footnote-19" target="_self">19</a>.</p><p>This matters because strict Boolean can accidentally drop relevant documents through no fault of the searcher. In my review of EBSCOhost Natural Language Search (NLS), I showed an example where I asked the system to find papers that used randomised controlled trials to test for an open access citation advantage. NLS generated a Boolean query and ran it against the index. It failed to surface one of the few obviously relevant papers, despite that paper being indexed in the database. The reason was straightforward: this early paper did not use the phrase &#8220;open access citation advantage,&#8221; and the Boolean that NLS constructed did not expand broadly enough to capture the terminology the paper did use. Under strict Boolean, that single vocabulary mismatch was fatal &#8212; the paper was excluded from the result set entirely.</p><p>A BM25 retriever would not have automatically excluded that paper. It would have scored it lower for missing some query terms, but the paper would still have entered the candidate set. 
With a strong reranker as a second stage &#8212; one capable of recognising that the paper is conceptually about the same topic even without exact term matches &#8212; that paper could be pushed to the top of the results. Semantic search approaches would handle this even more naturally, since dense embeddings capture conceptual similarity rather than relying on shared vocabulary at all.</p><p>This is the core limitation of Boolean as a retrieval method. It treats term matching as a gate: you are in or you are out. Every term that is missing from the query or absent from the document is a potential point of failure. BM25 and semantic methods treat term matching as a signal &#8212; one input among many into a relevance score &#8212; which is far more forgiving and far less dependent on the searcher anticipating every possible way an author might express a concept.</p></blockquote><p>The aggressive query expansion that causes so many problems under Boolean becomes largely unnecessary. Adding a strong reranker on top of first-stage BM25 is what all modern post-2019 information retrieval papers use as a strong baseline comparison.</p><p>But if we are willing to give up strict Boolean as the first stage, why not go further and use semantic search methods, either alone or as another component at the first stage? Dense embedding retrieval does not depend on term matching at all. It represents both queries and documents as vectors in a shared semantic space and retrieves documents by conceptual similarity. A paper about &#8220;myocardial infarction&#8221; can be retrieved by a query about &#8220;heart attack&#8221; without anyone &#8212; human or LLM &#8212; needing to specify that synonym. 
The vocabulary mismatch problem that has driven decades of query expansion work in library science is addressed at the architectural level rather than patched at the query level.</p><blockquote><p>The next level beyond semantic search would be agentic/deep search, which uses the LLM to do iterative searching and evaluation - often using both lexical and semantic search methods </p></blockquote><p>The practical objections are real but not insurmountable. Librarians value Boolean as a first stage retriever because it is predictable, inspectable, and gives them direct control over what enters the result set. Abandoning it at the first stage means accepting that retrieval becomes probabilistic &#8212; you can no longer guarantee that a specific document will or will not appear for a given query. <a href="https://aarontay.substack.com/p/the-case-of-the-vanishing-hit-count">Hit counts become approximate or meaningless.</a> The ability to teach students a logical, reproducible search process is diminished.</p><p>These are genuine losses. But we should weigh them against what is gained. The vocabulary mismatch problem &#8212; the single largest source of recall failure in academic search &#8212; is substantially mitigated. The need for aggressive synonym expansion, and all the ranking noise it creates, is eliminated. And the overall architecture becomes simpler: instead of Boolean retrieval followed by BM25 ranking followed by (hopefully) neural reranking, you can move to a hybrid first-stage retrieval using both BM25 and dense embeddings, followed by a single reranking step.</p><p>Most of the search industry reached this conclusion two decades ago. Google, Bing, and virtually every major web search engine abandoned strict Boolean for first-stage retrieval by the early 2000s going for BM25. Among academic search systems, Semantic Scholar uses BM25 rather than Boolean as its first-stage retriever. 
The library world remains one of the last holdouts &#8212; not because Boolean is technically superior, but because our professional training, our teaching practices, and our vendor relationships are all built around it.</p><p>I am not suggesting this transition will be easy or that Boolean should vanish overnight. A hybrid approach &#8212; using both lexical methods like BM25 and semantic methods alongside or instead of strict Boolean &#8212; is the most realistic path. Scopus AI and top class tools are already moving in this direction. But we should be clear-eyed about what we are defending when we insist on Boolean as the foundation. We are defending a retrieval method whose core limitation &#8212; binary matching &#8212; is the root cause of many of the problems this post has described.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee (via ko-fi)&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee (via ko-fi)</span></a></p><p></p><h2>The bottom line</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Ni1u!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b2be2e9-6007-42d3-acd3-b7296272eb31_1157x658.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Ni1u!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b2be2e9-6007-42d3-acd3-b7296272eb31_1157x658.png 424w, 
https://substackcdn.com/image/fetch/$s_!Ni1u!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b2be2e9-6007-42d3-acd3-b7296272eb31_1157x658.png 848w, https://substackcdn.com/image/fetch/$s_!Ni1u!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b2be2e9-6007-42d3-acd3-b7296272eb31_1157x658.png 1272w, https://substackcdn.com/image/fetch/$s_!Ni1u!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b2be2e9-6007-42d3-acd3-b7296272eb31_1157x658.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Ni1u!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b2be2e9-6007-42d3-acd3-b7296272eb31_1157x658.png" width="1157" height="658" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/2b2be2e9-6007-42d3-acd3-b7296272eb31_1157x658.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:658,&quot;width&quot;:1157,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:902047,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/191539701?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b2be2e9-6007-42d3-acd3-b7296272eb31_1157x658.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!Ni1u!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b2be2e9-6007-42d3-acd3-b7296272eb31_1157x658.png 424w, https://substackcdn.com/image/fetch/$s_!Ni1u!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b2be2e9-6007-42d3-acd3-b7296272eb31_1157x658.png 848w, https://substackcdn.com/image/fetch/$s_!Ni1u!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b2be2e9-6007-42d3-acd3-b7296272eb31_1157x658.png 1272w, https://substackcdn.com/image/fetch/$s_!Ni1u!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b2be2e9-6007-42d3-acd3-b7296272eb31_1157x658.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" 
stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>LLM-to-Boolean is not worthless. But it is a minor component being marketed as the whole solution. It solves a narrow problem &#8212; helping novices who cannot construct any Boolean at all &#8212; while doing nothing for the majority who need better-ranked results. As a first-stage query construction aid paired with modern reranking, it could play a useful supporting role. On its own, with the same BM25 ranking underneath, it changes almost nothing that matters.</p><p>The horseless carriage eventually gave way to the automobile &#8212; a machine designed from the ground up around the capabilities of the engine, not around the form of what came before. Library search needs the same transition. The real bottleneck is not retrieval &#8212; it is ranking. And for complex queries, it is not even ranking &#8212; it is the absence of iterative, evaluative search processes that can reason about what they find.</p><p>The infrastructure to do better already exists. Semantic Scholar and PubMed have proven that two-stage architectures work at scale. Agentic deep search tools have demonstrated what is possible when LLMs are used as reasoning engines rather than Boolean generators. 
Some libraries are already taking this path &#8212; <a href="https://ital.corejournals.org/index.php/ital/article/view/17511/11968">Harvard Library, for instance, bypassed LLM-to-Boolean entirely for their special collections, building a discovery platform called Collections Explorer that relies on embedding models.</a></p><p>The question is whether library vendors will invest in these approaches, and whether we as a profession will demand they do &#8212; or whether we will keep admiring the horseless carriage because we can see how the reins work.</p><div class="captioned-button-wrap" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/the-horseless-carriage-of-ai-search?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="CaptionedButtonToDOM"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! This post is public so feel free to share it.</p></div><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/the-horseless-carriage-of-ai-search?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://aarontay.substack.com/p/the-horseless-carriage-of-ai-search?utm_source=substack&utm_medium=email&utm_content=share&action=share"><span>Share</span></a></p></div><p></p><p></p><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-1" href="#footnote-anchor-1" class="footnote-number" contenteditable="false" target="_self">1</a><div class="footnote-content"><p><a href="https://bsky.app/profile/metasynthesis.net/post/3ma4nlupfo22k">William Gunn first made this point to me.</a></p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-2" href="#footnote-anchor-2" class="footnote-number" contenteditable="false" 
target="_self">2</a><div class="footnote-content"><p>Librarians always worry about the environmental impact of LLM use, and in this case one might be skeptical of the cost-benefit analysis of using LLMs to convert queries into Boolean.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-3" href="#footnote-anchor-3" class="footnote-number" contenteditable="false" target="_self">3</a><div class="footnote-content"><p><a href="https://www.staff.city.ac.uk/~sbrp622/papers/foundations_bm25_review.pdf?utm_source=chatgpt.com">BM25 was introduced in 1994, though it grew out of earlier probabilistic IR work from the 1970s and 1980s</a>. <a href="https://opensourceconnections.com/blog/2015/10/16/bm25-the-next-generation-of-lucene-relevation/">By 2015/2016, popular commercial search platforms like Elasticsearch made BM25 the default over TF-IDF.</a></p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-4" href="#footnote-anchor-4" class="footnote-number" contenteditable="false" target="_self">4</a><div class="footnote-content"><p>I do think LLMs will eventually be able to generate expert-searcher-level search strategies. The path forward is agentic search combined with tool use (e.g. a system to check MeSH): an LLM that can construct an initial query, run it, evaluate the results against inclusion criteria, identify gaps in coverage, reformulate and expand the search, test the revised strategy against known relevant studies, and iterate until recall targets are met. This is exactly the way a professional searcher does it! Note: this is qualitatively different from generating a single Boolean string and hoping it works.  
</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-5" href="#footnote-anchor-5" class="footnote-number" contenteditable="false" target="_self">5</a><div class="footnote-content"><p>Some systems instruct LLMs to generate multiple phrase searches to be OR&#8217;d together (e.g. Primo Research Assistant) but the result is similar.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-6" href="#footnote-anchor-6" class="footnote-number" contenteditable="false" target="_self">6</a><div class="footnote-content"><p>Query expansion, and more broadly query reformulation (which encompasses expansion, term substitution, and structural transformation), remains an area of active research in information retrieval. That said, complex nested Boolean query construction receives relatively little attention in mainstream IR research, with evidence synthesis and, to some extent, patent and legal search being notable exceptions. More common approaches in current research include pseudo-relevance feedback, learned sparse expansion methods such as SPLADE, and <a href="https://x.com/nour_jedidi/status/2032142153460203529">dense retrieval techniques like HyDE (Hypothetical Document Embeddings)</a>, which generates a hypothetical answer document and uses its embedding as the query representation rather than expanding the query terms directly.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-7" href="#footnote-anchor-7" class="footnote-number" contenteditable="false" target="_self">7</a><div class="footnote-content"><p>Technically, variants like BM25F weight where the hit comes from, so a hit from full-text would be worth less than a match in the title or abstract but this is difficult to get right.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-8" href="#footnote-anchor-8" class="footnote-number" contenteditable="false" 
target="_self">8</a><div class="footnote-content"><p>I know everything is relative, there have been complaints about PubMed ATM of course.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-9" href="#footnote-anchor-9" class="footnote-number" contenteditable="false" target="_self">9</a><div class="footnote-content"><p>You have to account for the fact that currently Primo Research Assistant doesn&#8217;t search the local collections and some content owners like Elsevier, JSTOR have opted out.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-10" href="#footnote-anchor-10" class="footnote-number" contenteditable="false" target="_self">10</a><div class="footnote-content"><p>The study also tested PRA during its beta period with several major providers excluded, and PRA was judged on five returned items versus ten for conventional searches, so the comparison is suggestive rather than strictly like-for-like.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-11" href="#footnote-anchor-11" class="footnote-number" contenteditable="false" target="_self">11</a><div class="footnote-content"><p><a href="https://drive.google.com/file/d/1CDke4xGQFCuzgzpBj7dt92Fe0IMFr2Ij/view?usp=drivesdk">Stony Brook uses multiple concurrent agents for query construction, which is technically agentic </a>but fundamentally different from agentic search that does iterative deep search, and/or evaluate results e.g. Undermind, Consensus Deep Search. The agents here assemble a single query in parallel, then hand it off to Primo.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-12" href="#footnote-anchor-12" class="footnote-number" contenteditable="false" target="_self">12</a><div class="footnote-content"><p>How easy is it? Consider how even relatively smaller institutions are doing similar experiments. 
Essentially all you need to do is to hook up the input to an LLM API and prompt it to give a Boolean output!</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-13" href="#footnote-anchor-13" class="footnote-number" contenteditable="false" target="_self">13</a><div class="footnote-content"><p>There is a middle path that avoids the need to pre-index embeddings for the entire collection: generate embeddings at query time and rerank only a small number of retrieved results, as Primo Research Assistant does with the top 30. This sidesteps the cost of indexing billions of records into a vector store. The trade-off is speed &#8212; computing embeddings on the fly for every query adds latency that users will notice, and the small reranking window means you are only re-sorting a tiny fraction of the candidate set. Reranking 30 results is better than reranking none, but it is a long way from reranking the top 500 or 1,000, where the real quality gains appear.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-14" href="#footnote-anchor-14" class="footnote-number" contenteditable="false" target="_self">14</a><div class="footnote-content"><p>There are studies that <a href="https://youtu.be/Mi-Bo1wRlFA?si=lUA1BwDoRAHI6uPh">suggest Primo Research Assistant isn&#8217;t too far behind in capability to advanced modern systems like Elicit or Undermind</a> but these studies often test with &#8220;Easy queries&#8221; and/or they test with queries where Primo Research Assistant has an advantage in terms of their index coverage (PRA includes monographs and other non-article type content).</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-15" href="#footnote-anchor-15" class="footnote-number" contenteditable="false" target="_self">15</a><div class="footnote-content"><p>I grant you that with BM25 ranking systems, most librarians could roughly convince themselves why a result 
was in the top 5 just by looking for stemmed term matches.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-16" href="#footnote-anchor-16" class="footnote-number" contenteditable="false" target="_self">16</a><div class="footnote-content"><p>I am old school enough to remember back in the 2010s when the Summon mailing list would be abuzz with librarians angry that, when comparing two queries, the results made no logical sense because one gave more results when it should have given fewer. This could have multiple explanations; for example, some expansion rule was silently triggered when the number of results fell below some threshold.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-17" href="#footnote-anchor-17" class="footnote-number" contenteditable="false" target="_self">17</a><div class="footnote-content"><p>Some systems would need a hard match of at least X out of Y terms for the document to be considered for ranking, others might only drop out of strict Boolean mode if the query is beyond a certain length etc. </p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-18" href="#footnote-anchor-18" class="footnote-number" contenteditable="false" target="_self">18</a><div class="footnote-content"><p>One way you could test if a system was using BM25 as a retriever would be to enter 3 normal terms and one made-up word. A Boolean system would definitely give you zero results. One that used BM25 as a retriever would still give you some results. Of course, these days, the system could also be using a non-lexical semantic search system. 
</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-19" href="#footnote-anchor-19" class="footnote-number" contenteditable="false" target="_self">19</a><div class="footnote-content"><p>There is a persistent myth among librarians that Google of the 2000s to 2010s wasn&#8217;t a lexical/keyword search system just because it didn&#8217;t do strict Boolean. In fact, it was mostly a keyword search, just that it did not implement strict Boolean - at least in the 2010s, and if you knew a couple of tricks (check the cached web for what the crawler actually indexed, look at link text, etc.), the search results were more interpretable than you might think. Still, it was definitely far less interpretable and predictable than typical library databases.</p><p></p></div></div>]]></content:encoded></item><item><title><![CDATA[The agentic researcher - building custom, transparent and extensible workflows with Claude & MCP]]></title><description><![CDATA[Why generic LLM + academic MCP servers might be as good if not better than specialised Academic deep research]]></description><link>https://aarontay.substack.com/p/creating-your-own-research-assistant</link><guid isPermaLink="false">https://aarontay.substack.com/p/creating-your-own-research-assistant</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Mon, 23 Feb 2026 18:52:31 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!ln1-!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffa6d8137-11ed-47dd-a9b3-9e19fa014267_1208x666.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!ln1-!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffa6d8137-11ed-47dd-a9b3-9e19fa014267_1208x666.png" 
data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!ln1-!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffa6d8137-11ed-47dd-a9b3-9e19fa014267_1208x666.png 424w, https://substackcdn.com/image/fetch/$s_!ln1-!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffa6d8137-11ed-47dd-a9b3-9e19fa014267_1208x666.png 848w, https://substackcdn.com/image/fetch/$s_!ln1-!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffa6d8137-11ed-47dd-a9b3-9e19fa014267_1208x666.png 1272w, https://substackcdn.com/image/fetch/$s_!ln1-!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffa6d8137-11ed-47dd-a9b3-9e19fa014267_1208x666.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!ln1-!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffa6d8137-11ed-47dd-a9b3-9e19fa014267_1208x666.png" width="1208" height="666" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/fa6d8137-11ed-47dd-a9b3-9e19fa014267_1208x666.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:666,&quot;width&quot;:1208,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:807559,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/188857498?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffa6d8137-11ed-47dd-a9b3-9e19fa014267_1208x666.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!ln1-!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffa6d8137-11ed-47dd-a9b3-9e19fa014267_1208x666.png 424w, https://substackcdn.com/image/fetch/$s_!ln1-!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffa6d8137-11ed-47dd-a9b3-9e19fa014267_1208x666.png 848w, https://substackcdn.com/image/fetch/$s_!ln1-!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffa6d8137-11ed-47dd-a9b3-9e19fa014267_1208x666.png 1272w, https://substackcdn.com/image/fetch/$s_!ln1-!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffa6d8137-11ed-47dd-a9b3-9e19fa014267_1208x666.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>When I last <a href="https://aarontay.substack.com/p/mcp-servers-and-academic-search-the">wrote about MCP servers</a> in the context of the <a href="https://www.wiley.com/en-us/solutions-partnerships/ai-solutions/">launch of Wiley&#8217;s AI Gateway</a> and the <a href="https://www.anthropic.com/news/claude-for-life-sciences#:~:text=PubMed%20provides%20access%20to%20millions%20of%20biomedical%20research%20articles%20and%20clinical%20studies%3B">PubMed MCP server/connector you could add to Claude.ai</a>, I received a few private messages from librarians and researchers who shared how much more they had gone beyond just connecting to pre-built MCP servers.</p><p>Most of them were using <a href="https://code.claude.com/docs/en/overview">Claude Code</a> or <a href="https://code.claude.com/docs/en/desktop">Claude Code Desktop</a>, which 
they used to:</p><p>a) vibe-code MCP servers that did not exist or were not offered, and run the servers locally</p><p>b) combine MCP servers and other tools with <a href="https://claude.com/skills">Claude Skills</a> for powerful workflows</p><p>Since then, I have started exploring the use of Claude Code and Claude Code Desktop myself, and while I am still a rank novice in this area, I can see why people are so excited by the possibilities.</p><p>But before I walk through the practicalities, I want to make the case for why this matters &#8212; because it is not just about convenience. It represents an almost fundamentally different model for how academic search and workflows in general can work.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee (via ko-fi)&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee (via ko-fi)</span></a></p><p></p><p>In my recent post on <a href="https://aarontay.substack.com/p/how-agentic-are-academic-deep-research">how &#8220;agentic&#8221; current academic deep research tools really are</a>, I found that while specialised deep research tools like <a href="https://consensus.app/home/blog/deep-search/">Consensus Deep Search</a>, <a href="http://undermind.ai">Undermind</a>, <a href="http://elicit.com">Elicit</a>, etc. perform impressively within their designed parameters, their agency is ultimately bounded by rigid, pre-programmed workflows. 
They execute complex, multi-step loops rapidly and cheaply, but the moment a research query steps outside those hardcoded tracks &#8212; requiring a novel combination of tools and capabilities such as filters, unconventional citation tree traversal, or data extraction the vendor did not anticipate &#8212; these fixed pathways become bottlenecks.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!gqVF!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3ee6af82-0a5e-4ec9-b1e5-4ae3f507bc32_1193x683.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!gqVF!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3ee6af82-0a5e-4ec9-b1e5-4ae3f507bc32_1193x683.png 424w, https://substackcdn.com/image/fetch/$s_!gqVF!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3ee6af82-0a5e-4ec9-b1e5-4ae3f507bc32_1193x683.png 848w, https://substackcdn.com/image/fetch/$s_!gqVF!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3ee6af82-0a5e-4ec9-b1e5-4ae3f507bc32_1193x683.png 1272w, https://substackcdn.com/image/fetch/$s_!gqVF!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3ee6af82-0a5e-4ec9-b1e5-4ae3f507bc32_1193x683.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!gqVF!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3ee6af82-0a5e-4ec9-b1e5-4ae3f507bc32_1193x683.png" width="1193" height="683" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/3ee6af82-0a5e-4ec9-b1e5-4ae3f507bc32_1193x683.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:683,&quot;width&quot;:1193,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1211688,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/188857498?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3ee6af82-0a5e-4ec9-b1e5-4ae3f507bc32_1193x683.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!gqVF!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3ee6af82-0a5e-4ec9-b1e5-4ae3f507bc32_1193x683.png 424w, https://substackcdn.com/image/fetch/$s_!gqVF!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3ee6af82-0a5e-4ec9-b1e5-4ae3f507bc32_1193x683.png 848w, https://substackcdn.com/image/fetch/$s_!gqVF!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3ee6af82-0a5e-4ec9-b1e5-4ae3f507bc32_1193x683.png 1272w, https://substackcdn.com/image/fetch/$s_!gqVF!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3ee6af82-0a5e-4ec9-b1e5-4ae3f507bc32_1193x683.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This highlights a fundamental tension: as frontier models become increasingly capable of advanced reasoning, forcing them through restrictive, &#8220;on-rails&#8221; product interfaces artificially caps their utility. 
These tools treat information retrieval as a static funnel rather than a dynamic, iterative process, leaving the researcher constrained by the vendor&#8217;s imagination.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!mYiU!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f55bced-5c15-4f0d-9f76-1b7db9617dcb_1024x1024.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!mYiU!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f55bced-5c15-4f0d-9f76-1b7db9617dcb_1024x1024.jpeg 424w, https://substackcdn.com/image/fetch/$s_!mYiU!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f55bced-5c15-4f0d-9f76-1b7db9617dcb_1024x1024.jpeg 848w, https://substackcdn.com/image/fetch/$s_!mYiU!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f55bced-5c15-4f0d-9f76-1b7db9617dcb_1024x1024.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!mYiU!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f55bced-5c15-4f0d-9f76-1b7db9617dcb_1024x1024.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!mYiU!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f55bced-5c15-4f0d-9f76-1b7db9617dcb_1024x1024.jpeg" width="1024" height="1024" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/0f55bced-5c15-4f0d-9f76-1b7db9617dcb_1024x1024.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1024,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:153775,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/188857498?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f55bced-5c15-4f0d-9f76-1b7db9617dcb_1024x1024.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!mYiU!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f55bced-5c15-4f0d-9f76-1b7db9617dcb_1024x1024.jpeg 424w, https://substackcdn.com/image/fetch/$s_!mYiU!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f55bced-5c15-4f0d-9f76-1b7db9617dcb_1024x1024.jpeg 848w, https://substackcdn.com/image/fetch/$s_!mYiU!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f55bced-5c15-4f0d-9f76-1b7db9617dcb_1024x1024.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!mYiU!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0f55bced-5c15-4f0d-9f76-1b7db9617dcb_1024x1024.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" 
width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>LLMs connected with MCP servers change this. Instead of a vendor-defined loop, it allows researchers to build custom, transparent, and extensible research environments. The AI is not limited to searching a single closed index. </p><p>For example, it can reach into a local Zotero library, query live institutional repositories, chain outputs from one search system into another, and execute code to analyse data on the fly. 
</p><blockquote><p>The agent moves from being a search tool to something closer to a real research assistant that can have autonomy to &#8220;decide&#8221; which tools to use and in which order and/or an assistant that the researcher can instruct via Claude Skills.</p></blockquote><p>The rest of this post lays out the evidence that this is not just a theoretical advantage, walks through how to actually set it up, and addresses the current limitations of such a setup and implications for librarians.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe now&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://aarontay.substack.com/subscribe?"><span>Subscribe now</span></a></p><h2>Can generic LLMs actually compete on retrieval?</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!e0kX!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6ecec02-0a41-4ab4-8476-a0590eb29f11_1192x661.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!e0kX!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6ecec02-0a41-4ab4-8476-a0590eb29f11_1192x661.png 424w, https://substackcdn.com/image/fetch/$s_!e0kX!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6ecec02-0a41-4ab4-8476-a0590eb29f11_1192x661.png 848w, 
https://substackcdn.com/image/fetch/$s_!e0kX!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6ecec02-0a41-4ab4-8476-a0590eb29f11_1192x661.png 1272w, https://substackcdn.com/image/fetch/$s_!e0kX!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6ecec02-0a41-4ab4-8476-a0590eb29f11_1192x661.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!e0kX!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6ecec02-0a41-4ab4-8476-a0590eb29f11_1192x661.png" width="1192" height="661" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/d6ecec02-0a41-4ab4-8476-a0590eb29f11_1192x661.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:661,&quot;width&quot;:1192,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:801666,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/188857498?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6ecec02-0a41-4ab4-8476-a0590eb29f11_1192x661.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!e0kX!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6ecec02-0a41-4ab4-8476-a0590eb29f11_1192x661.png 424w, 
https://substackcdn.com/image/fetch/$s_!e0kX!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6ecec02-0a41-4ab4-8476-a0590eb29f11_1192x661.png 848w, https://substackcdn.com/image/fetch/$s_!e0kX!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6ecec02-0a41-4ab4-8476-a0590eb29f11_1192x661.png 1272w, https://substackcdn.com/image/fetch/$s_!e0kX!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6ecec02-0a41-4ab4-8476-a0590eb29f11_1192x661.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The obvious objection is: surely purpose-built academic search tools such as Elicit.com, Undermind.ai and Consensus retrieve better results than a general-purpose LLM? The evidence is currently more mixed than you might expect.</p><p>A <a href="https://www.youtube.com/watch?si=Bed9e-tlienLvFd_&amp;v=rKhwikQe26w&amp;feature=youtu.be">video study by Moara</a> claimed Claude's web search (with no special academic connectors) beat Undermind, Elicit, SciSpace, Consensus, and Scholar Labs on retrieval quality. </p><div id="youtube2-rKhwikQe26w" class="youtube-wrap" data-attrs="{&quot;videoId&quot;:&quot;rKhwikQe26w&quot;,&quot;startTime&quot;:null,&quot;endTime&quot;:null}" data-component-name="Youtube2ToDOM"><div class="youtube-inner"><iframe src="https://www.youtube-nocookie.com/embed/rKhwikQe26w?rel=0&amp;autoplay=0&amp;showinfo=0&amp;enablejsapi=0" frameborder="0" loading="lazy" gesture="media" allow="autoplay; fullscreen" allowautoplay="true" allowfullscreen="true" width="728" height="409"></iframe></div></div><p>This study has significant methodological problems: it tested only a single query and looked only at the top 10 results, the evaluation relied mostly on LLM-as-judge (ChatGPT, Gemini and Claude may be biased towards output from fellow LLMs despite attempts to anonymize), and the query may have favoured grey literature that specialised tools cannot access. </p><p>That said, the human evaluators agreed with the ranking, and it is notable that Undermind &#8212; which I generally regard as among the strongest specialised tools &#8212; came second (see also an <a href="https://www.youtube.com/watch?v=c1xBIMKQVpY">earlier study by Moara that ranked Undermind first among all specialised tools</a>).</p><p>I have found similar patterns in my own testing, though I stress these are illustrative examples rather than systematic evaluations. 
When asked whether OpenAlex can be used alone for systematic reviews, <a href="https://app.undermind.ai/report/a591d6945b262b04e1d96ebce005f332ade1ee017299b94bdb26321733d14e96">Undermind found two relevant items</a>. Claude (without any specialised MCP server) found the same two,<a href="https://www.fhi.no/en/publ/2023/Evaluation-of-OpenAlex/"> plus a third relevant grey literature report </a>that was not in Semantic Scholar&#8217;s index. </p><div class="bluesky-wrap outer" style="height: auto; display: flex; margin-bottom: 24px;" data-attrs="{&quot;postId&quot;:&quot;3mf4qdvm5os2t&quot;,&quot;authorDid&quot;:&quot;did:plc:3z5zbwdbqmw2qobnb5zsfdbu&quot;,&quot;authorName&quot;:&quot;Aaron Tay&quot;,&quot;authorHandle&quot;:&quot;aarontay.bsky.social&quot;,&quot;authorAvatarUrl&quot;:&quot;https://cdn.bsky.app/img/avatar/plain/did:plc:3z5zbwdbqmw2qobnb5zsfdbu/bafkreiezhmit3ar7icmsmjtz64n4rspz6uarmpeqbeoyhiej74qbowy7ri@jpeg&quot;,&quot;text&quot;:&quot;Undermind is the only specialised academic search I tested that put up a good fight finding 2-3 relevant papers at the top app.undermind.ai/report/a591d.... But it still fails to find grey literature like www.fhi.no/en/publ/2023... 
that Claude spotted.&quot;,&quot;createdAt&quot;:&quot;2026-02-18T09:11:45.040Z&quot;,&quot;uri&quot;:&quot;at://did:plc:3z5zbwdbqmw2qobnb5zsfdbu/app.bsky.feed.post/3mf4qdvm5os2t&quot;,&quot;imageUrls&quot;:[&quot;https://cdn.bsky.app/img/feed_thumbnail/plain/did:plc:3z5zbwdbqmw2qobnb5zsfdbu/bafkreie2e3rkh4kwcdykrqoexucevn7l2ybbtwujgfgtq6lfjag6ziox7i@jpeg&quot;]}" data-component-name="BlueskyCreateBlueskyEmbed"><iframe id="bluesky-3mf4qdvm5os2t" data-bluesky-id="3206031818876687" src="https://embed.bsky.app/embed/did:plc:3z5zbwdbqmw2qobnb5zsfdbu/app.bsky.feed.post/3mf4qdvm5os2t?id=3206031818876687" width="100%" style="display: block; flex-grow: 1;" frameborder="0" scrolling="no"></iframe></div><p></p><p>Most striking was how Consensus Deep Search failed to find any relevant papers on this query, while Claude even with the Consensus MCP server (which is limited to just the top 3 results) did find relevant papers. This is a peculiar case where Consensus&#8217;s deep search mode, spending far more time and compute, produced worse results than its own index queried through a basic MCP connection.</p><p></p><div class="bluesky-wrap outer" style="height: auto; display: flex; margin-bottom: 24px;" data-attrs="{&quot;postId&quot;:&quot;3mf4q6nes4c2t&quot;,&quot;authorDid&quot;:&quot;did:plc:3z5zbwdbqmw2qobnb5zsfdbu&quot;,&quot;authorName&quot;:&quot;Aaron Tay&quot;,&quot;authorHandle&quot;:&quot;aarontay.bsky.social&quot;,&quot;authorAvatarUrl&quot;:&quot;https://cdn.bsky.app/img/avatar/plain/did:plc:3z5zbwdbqmw2qobnb5zsfdbu/bafkreiezhmit3ar7icmsmjtz64n4rspz6uarmpeqbeoyhiej74qbowy7ri@jpeg&quot;,&quot;text&quot;:&quot;As you can see below Claude easily spots the critical Stansfield et al. (2025) paper by searching Consensus. 
Curious that Consensus Deep Search that does a ton more searches either fails to find it or somehow ranks it so low it isnt picked up?&quot;,&quot;createdAt&quot;:&quot;2026-02-18T09:08:48.637Z&quot;,&quot;uri&quot;:&quot;at://did:plc:3z5zbwdbqmw2qobnb5zsfdbu/app.bsky.feed.post/3mf4q6nes4c2t&quot;,&quot;imageUrls&quot;:[&quot;https://cdn.bsky.app/img/feed_thumbnail/plain/did:plc:3z5zbwdbqmw2qobnb5zsfdbu/bafkreib3kpwsfn2d4rpjxgctbluzoylczgago3qulkk7s5k3gco54vs6aa@jpeg&quot;]}" data-component-name="BlueskyCreateBlueskyEmbed"><iframe id="bluesky-3mf4q6nes4c2t" data-bluesky-id="13034535484179832" src="https://embed.bsky.app/embed/did:plc:3z5zbwdbqmw2qobnb5zsfdbu/app.bsky.feed.post/3mf4q6nes4c2t?id=13034535484179832" width="100%" style="display: block; flex-grow: 1;" frameborder="0" scrolling="no"></iframe></div><p></p><p>A more systematic comparison comes from <a href="https://youtu.be/Mi-Bo1wRlFA?si=lUA1BwDoRAHI6uPh">a librarian who tested 11 queries</a> across multiple tools. Using a scoring rubric, Claude (again without any special MCP servers) ended up on top ahead of Consensus, Elicit, and Primo Research Assistant, though not by a statistically significant margin. 
</p><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://youtu.be/Mi-Bo1wRlFA?si=lUA1BwDoRAHI6uPh" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!pgqh!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbaa674c8-8c05-4094-b55b-3f0a69dd7610_1307x717.png 424w, https://substackcdn.com/image/fetch/$s_!pgqh!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbaa674c8-8c05-4094-b55b-3f0a69dd7610_1307x717.png 848w, https://substackcdn.com/image/fetch/$s_!pgqh!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbaa674c8-8c05-4094-b55b-3f0a69dd7610_1307x717.png 1272w, https://substackcdn.com/image/fetch/$s_!pgqh!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbaa674c8-8c05-4094-b55b-3f0a69dd7610_1307x717.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!pgqh!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbaa674c8-8c05-4094-b55b-3f0a69dd7610_1307x717.png" width="1307" height="717" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/baa674c8-8c05-4094-b55b-3f0a69dd7610_1307x717.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:717,&quot;width&quot;:1307,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:&quot;https://youtu.be/Mi-Bo1wRlFA?si=lUA1BwDoRAHI6uPh&quot;,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!pgqh!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbaa674c8-8c05-4094-b55b-3f0a69dd7610_1307x717.png 424w, https://substackcdn.com/image/fetch/$s_!pgqh!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbaa674c8-8c05-4094-b55b-3f0a69dd7610_1307x717.png 848w, https://substackcdn.com/image/fetch/$s_!pgqh!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbaa674c8-8c05-4094-b55b-3f0a69dd7610_1307x717.png 1272w, https://substackcdn.com/image/fetch/$s_!pgqh!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbaa674c8-8c05-4094-b55b-3f0a69dd7610_1307x717.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>Part of the reason for this is that some queries were best answered by non-journal content &#8212; monographs and grey literature &#8212; where Claude and Primo (which draws on broader library collections) had a structural advantage over tools that rely primarily on OpenAlex or Semantic Scholar.</p><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!WPNP!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd70728d-2d11-4649-9af3-a67f2927253d_1200x675.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!WPNP!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd70728d-2d11-4649-9af3-a67f2927253d_1200x675.png 424w, 
https://substackcdn.com/image/fetch/$s_!WPNP!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd70728d-2d11-4649-9af3-a67f2927253d_1200x675.png 848w, https://substackcdn.com/image/fetch/$s_!WPNP!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd70728d-2d11-4649-9af3-a67f2927253d_1200x675.png 1272w, https://substackcdn.com/image/fetch/$s_!WPNP!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd70728d-2d11-4649-9af3-a67f2927253d_1200x675.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!WPNP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd70728d-2d11-4649-9af3-a67f2927253d_1200x675.png" width="1200" height="675" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/dd70728d-2d11-4649-9af3-a67f2927253d_1200x675.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:675,&quot;width&quot;:1200,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1237113,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/188857498?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd70728d-2d11-4649-9af3-a67f2927253d_1200x675.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!WPNP!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd70728d-2d11-4649-9af3-a67f2927253d_1200x675.png 424w, https://substackcdn.com/image/fetch/$s_!WPNP!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd70728d-2d11-4649-9af3-a67f2927253d_1200x675.png 848w, https://substackcdn.com/image/fetch/$s_!WPNP!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd70728d-2d11-4649-9af3-a67f2927253d_1200x675.png 1272w, https://substackcdn.com/image/fetch/$s_!WPNP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd70728d-2d11-4649-9af3-a67f2927253d_1200x675.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" 
stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>None of this constitutes definitive evidence that generic LLMs are superior. The sample sizes are small, the methodologies vary, and important details are often unclear (for instance, it is not always specified whether deep search modes were used for the specialised tools, or whether Claude was running in its more powerful &#8220;Research&#8221; mode). What the evidence does suggest is that generic LLMs are not clearly worse at finding relevant sources, particularly for queries that benefit from content outside journal &amp; preprint article indexes.</p><p>To be clear, I am referring to the ability to find relevant sources. Specialised tools offer other affordances not offered by generic LLMs. These include structured output with academic references, useful visualizations and methodological transparency (sometimes). But on raw retrieval, the gap has narrowed considerably.</p><blockquote><p>This is why I now recommend that users combine a specialised academic deep research tool (such as Undermind, Consensus, or Elicit in their deep modes) with a generic deep research tool (such as OpenAI or Gemini Deep Research, or Claude with Research mode) for greater coverage. 
</p></blockquote><p>This is particularly important the more humanities-oriented or less journal-centric your subject area is, as the specialised tools tend to rely on OpenAlex and Semantic Scholar, which have weaker coverage in these areas.</p><h2>What are MCP servers and why do they matter here?</h2><p>If generic LLMs are already competitive at retrieval, the obvious next question is: how do you make this reliable rather than hit-or-miss?</p><p>If, indeed, general web-backed LLM search can match specialised tools on top-N relevance for some query types (especially those requiring grey literature or books), could we do even better with access to specialised academic content?</p><p>The problem with relying on general web search for academic work is that even when explicitly instructed to find peer-reviewed sources, LLMs will still sometimes cite blog posts, news articles, and other non-academic content. They draw from the open web and do not always distinguish between a journal article and a well-written blog post on the same topic. Giving these models a direct connection to academic indexes, rather than hoping they stumble on the right content through web search, is what turns an occasionally useful capability into a dependable one.</p><p>This is exactly what the Model Context Protocol enables. MCP is an open standard, supported to some extent by all three major AI labs (Anthropic, OpenAI, and Google), that allows LLMs to connect to external tools and data sources. Give a model direct access to PubMed, Scopus, or your institutional repository, and it no longer has to guess whether what it found on the web is actually a scholarly source. 
</p><p>And if you can give it access to paywalled full text via publisher MCP servers, such as Wiley&#8217;s Gateway AI server, you could potentially give it an advantage over specialised tools like Undermind that rely only on open corpora like Semantic Scholar.</p><p>There is already considerable buzz around setting up MCP servers for library-specific resources &#8212; the library catalogue, discovery services, institutional repositories, and more. This <a href="https://youtu.be/SgFsxlCQvOE">CNI talk</a> is an excellent example of what leading libraries like Northeastern are currently doing in this space. </p><div id="youtube2-SgFsxlCQvOE" class="youtube-wrap" data-attrs="{&quot;videoId&quot;:&quot;SgFsxlCQvOE&quot;,&quot;startTime&quot;:null,&quot;endTime&quot;:null}" data-component-name="Youtube2ToDOM"><div class="youtube-inner"><iframe src="https://www.youtube-nocookie.com/embed/SgFsxlCQvOE?rel=0&amp;autoplay=0&amp;showinfo=0&amp;enablejsapi=0" frameborder="0" loading="lazy" gesture="media" allow="autoplay; fullscreen" allowautoplay="true" allowfullscreen="true" width="728" height="409"></iframe></div></div><p></p><p>The reasoning is straightforward. Whilst librarians and some power users reach for specialised deep research tools like Elicit, Undermind, Consensus, and Scite Assistant, most students and researchers spend the bulk of their time in ChatGPT, Gemini, or Claude. So why not meet them where they are? </p><p>MCP servers come in two varieties: remote servers, which are hosted by someone else and you simply point your LLM interface to them; and local servers, which you run on your own machine.</p><blockquote><p><strong>A necessary warning </strong>: connecting your LLM to MCP servers carries risks. The operators of remote MCP servers can see your queries, and there are security risks including prompt injection. 
Running local servers from unverified GitHub repositories carries its own risks (since it involves running code on your machine!), though it does improve privacy since queries stay on your machine.</p></blockquote><h2>Setting up remote MCP servers</h2><p>Remote MCP servers are the simplest to get started with. In Claude.ai, you can find Consensus, PubMed, and Scholar Gateway listed as available connectors that can be added directly. Scite.ai has to be manually added.</p><p>Support for MCP servers is more complicated with ChatGPT.com. While ChatGPT recently started supporting MCP servers through its apps system, it does not yet list any academic search connectors in its store at the time of writing. You can work around this, though it requires a paid account and a somewhat hacky process:</p><ol><li><p>Go to Settings, then Apps, then Advanced settings, and <a href="https://developers.openai.com/api/docs/guides/developer-mode/">enable Developer mode</a>.</p></li><li><p>Open ChatGPT Apps settings and click &#8220;Create app&#8221; next to Advanced settings.</p></li><li><p>Create an app for your remote MCP server using the server URL.</p></li></ol><p>The MCP server URLs that work without any authentication are:</p><ul><li><p><strong>Consensus</strong>: <code>https://mcp.consensus.app/mcp</code> (<a href="https://consensus.app/home/mcp/">documentation</a>)</p></li><li><p><strong>PubMed</strong>: <code>https://pubmed.mcp.claude.com/mcp</code> (hosted by Anthropic as a connector for Claude; this is the same connector <a href="https://aarontay.substack.com/p/mcp-servers-and-academic-search-the">I tested in my earlier blog post</a>)</p></li><li><p><strong>Scite.ai</strong>: <code>https://api.scite.ai/mcp</code> (<a href="https://scite.ai/mcp">documentation</a>)</p></li></ul><p>Edit: As of 28 Feb, Scite is now listed in the ChatGPT store, so you no longer need to turn on Developer mode. 
Scispace.com has followed suit as well.</p><p>Edit: As of 29 April, Scite is now listed in the list of Claude-supported Connectors, so you can just add it directly as well.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!zLcx!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6006b7a-c885-4e61-8828-956236e6e61a_410x622.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!zLcx!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6006b7a-c885-4e61-8828-956236e6e61a_410x622.png 424w, https://substackcdn.com/image/fetch/$s_!zLcx!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6006b7a-c885-4e61-8828-956236e6e61a_410x622.png 848w, https://substackcdn.com/image/fetch/$s_!zLcx!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6006b7a-c885-4e61-8828-956236e6e61a_410x622.png 1272w, https://substackcdn.com/image/fetch/$s_!zLcx!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6006b7a-c885-4e61-8828-956236e6e61a_410x622.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!zLcx!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6006b7a-c885-4e61-8828-956236e6e61a_410x622.png" width="410" height="622" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/d6006b7a-c885-4e61-8828-956236e6e61a_410x622.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:622,&quot;width&quot;:410,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!zLcx!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6006b7a-c885-4e61-8828-956236e6e61a_410x622.png 424w, https://substackcdn.com/image/fetch/$s_!zLcx!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6006b7a-c885-4e61-8828-956236e6e61a_410x622.png 848w, https://substackcdn.com/image/fetch/$s_!zLcx!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6006b7a-c885-4e61-8828-956236e6e61a_410x622.png 1272w, https://substackcdn.com/image/fetch/$s_!zLcx!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd6006b7a-c885-4e61-8828-956236e6e61a_410x622.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>Once set up, you can select these tools for use in your conversations or let ChatGPT decide when to invoke them.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!rsJg!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c3045a3-89c7-4beb-8ae8-b6881122bbb0_747x337.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!rsJg!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c3045a3-89c7-4beb-8ae8-b6881122bbb0_747x337.png 424w, https://substackcdn.com/image/fetch/$s_!rsJg!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c3045a3-89c7-4beb-8ae8-b6881122bbb0_747x337.png 848w, 
https://substackcdn.com/image/fetch/$s_!rsJg!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c3045a3-89c7-4beb-8ae8-b6881122bbb0_747x337.png 1272w, https://substackcdn.com/image/fetch/$s_!rsJg!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c3045a3-89c7-4beb-8ae8-b6881122bbb0_747x337.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!rsJg!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c3045a3-89c7-4beb-8ae8-b6881122bbb0_747x337.png" width="747" height="337" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/6c3045a3-89c7-4beb-8ae8-b6881122bbb0_747x337.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:337,&quot;width&quot;:747,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!rsJg!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c3045a3-89c7-4beb-8ae8-b6881122bbb0_747x337.png 424w, https://substackcdn.com/image/fetch/$s_!rsJg!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c3045a3-89c7-4beb-8ae8-b6881122bbb0_747x337.png 848w, 
https://substackcdn.com/image/fetch/$s_!rsJg!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c3045a3-89c7-4beb-8ae8-b6881122bbb0_747x337.png 1272w, https://substackcdn.com/image/fetch/$s_!rsJg!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c3045a3-89c7-4beb-8ae8-b6881122bbb0_747x337.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Below you can see the tool calling and searching Scite.ai</p><div class="captioned-image-container"><figure><a class="image-link image2 
is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!heTZ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0d3ca6db-65e1-402a-80d1-379e9b9413a4_1042x750.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!heTZ!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0d3ca6db-65e1-402a-80d1-379e9b9413a4_1042x750.png 424w, https://substackcdn.com/image/fetch/$s_!heTZ!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0d3ca6db-65e1-402a-80d1-379e9b9413a4_1042x750.png 848w, https://substackcdn.com/image/fetch/$s_!heTZ!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0d3ca6db-65e1-402a-80d1-379e9b9413a4_1042x750.png 1272w, https://substackcdn.com/image/fetch/$s_!heTZ!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0d3ca6db-65e1-402a-80d1-379e9b9413a4_1042x750.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!heTZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0d3ca6db-65e1-402a-80d1-379e9b9413a4_1042x750.png" width="1042" height="750" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/0d3ca6db-65e1-402a-80d1-379e9b9413a4_1042x750.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:750,&quot;width&quot;:1042,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!heTZ!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0d3ca6db-65e1-402a-80d1-379e9b9413a4_1042x750.png 424w, https://substackcdn.com/image/fetch/$s_!heTZ!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0d3ca6db-65e1-402a-80d1-379e9b9413a4_1042x750.png 848w, https://substackcdn.com/image/fetch/$s_!heTZ!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0d3ca6db-65e1-402a-80d1-379e9b9413a4_1042x750.png 1272w, https://substackcdn.com/image/fetch/$s_!heTZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0d3ca6db-65e1-402a-80d1-379e9b9413a4_1042x750.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Edit: <a href="https://www.youtube.com/watch?v=gcMel2guYE8">As of 25 March, Consensus is now listed in Claude Connectors (with ChatGPT coming soon), so you no longer need to create a custom MCP entry. It also automatically authenticates with your Consensus account, which will then give you access to the top 5 results.</a></p><p>Some limitations to be aware of: the <a href="https://consensus.app/home/mcp/">Consensus MCP server returns only the top 3 results out of 20 by default (though you can request an API key)</a>. <a href="https://scite.ai/mcp">The Scite MCP server provides access to open access citation data and metadata by default, though they note that institutional subscriptions can unlock additional content</a>. It is worth reading the documentation pages for each server to understand their full capabilities (e.g. search parameters, citation searching capabilities).</p><h2>Setting up local MCP servers</h2><p>Remote servers are limited to what is available. 
Code for running Semantic Scholar or OpenAlex MCP servers exists on GitHub, but nobody hosts these as free remote servers. </p><p>And if the MCP server you want does not exist at all, you can attempt to vibe-code one yourself (assuming an API exists for the source you want to connect to) and run it locally.</p><blockquote><p>Warning: Again, there are risks in running unverified MCP server code you find on GitHub, and the ones you vibe-code might have security vulnerabilities that can be exploited with prompt injection.</p></blockquote><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!CdxZ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F042359f6-c64b-425e-8aa3-e9e4da4e2409_708x514.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!CdxZ!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F042359f6-c64b-425e-8aa3-e9e4da4e2409_708x514.png 424w, https://substackcdn.com/image/fetch/$s_!CdxZ!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F042359f6-c64b-425e-8aa3-e9e4da4e2409_708x514.png 848w, https://substackcdn.com/image/fetch/$s_!CdxZ!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F042359f6-c64b-425e-8aa3-e9e4da4e2409_708x514.png 1272w, https://substackcdn.com/image/fetch/$s_!CdxZ!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F042359f6-c64b-425e-8aa3-e9e4da4e2409_708x514.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!CdxZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F042359f6-c64b-425e-8aa3-e9e4da4e2409_708x514.png" width="708" height="514" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/042359f6-c64b-425e-8aa3-e9e4da4e2409_708x514.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:514,&quot;width&quot;:708,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!CdxZ!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F042359f6-c64b-425e-8aa3-e9e4da4e2409_708x514.png 424w, https://substackcdn.com/image/fetch/$s_!CdxZ!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F042359f6-c64b-425e-8aa3-e9e4da4e2409_708x514.png 848w, https://substackcdn.com/image/fetch/$s_!CdxZ!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F042359f6-c64b-425e-8aa3-e9e4da4e2409_708x514.png 1272w, https://substackcdn.com/image/fetch/$s_!CdxZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F042359f6-c64b-425e-8aa3-e9e4da4e2409_708x514.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container 
restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Many early adopters are using Claude Code, Claude Desktop or Claude Cowork for this, all of which support local MCP servers. 
In my own Claude Desktop setup, I have configured and added several local MCP servers (with code I found on GitHub) alongside the remote ones:</p><ul><li><p>A <a href="https://github.com/54yyyu/zotero-mcp">Zotero MCP server</a> that connects Claude to my local reference library</p></li></ul><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!91iC!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2db0f39-3e51-4b6c-9f7f-7a5d09a482ce_708x1049.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!91iC!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2db0f39-3e51-4b6c-9f7f-7a5d09a482ce_708x1049.png 424w, https://substackcdn.com/image/fetch/$s_!91iC!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2db0f39-3e51-4b6c-9f7f-7a5d09a482ce_708x1049.png 848w, https://substackcdn.com/image/fetch/$s_!91iC!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2db0f39-3e51-4b6c-9f7f-7a5d09a482ce_708x1049.png 1272w, https://substackcdn.com/image/fetch/$s_!91iC!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2db0f39-3e51-4b6c-9f7f-7a5d09a482ce_708x1049.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!91iC!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2db0f39-3e51-4b6c-9f7f-7a5d09a482ce_708x1049.png" width="708" height="1049" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/a2db0f39-3e51-4b6c-9f7f-7a5d09a482ce_708x1049.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1049,&quot;width&quot;:708,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!91iC!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2db0f39-3e51-4b6c-9f7f-7a5d09a482ce_708x1049.png 424w, https://substackcdn.com/image/fetch/$s_!91iC!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2db0f39-3e51-4b6c-9f7f-7a5d09a482ce_708x1049.png 848w, https://substackcdn.com/image/fetch/$s_!91iC!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2db0f39-3e51-4b6c-9f7f-7a5d09a482ce_708x1049.png 1272w, https://substackcdn.com/image/fetch/$s_!91iC!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2db0f39-3e51-4b6c-9f7f-7a5d09a482ce_708x1049.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><ul><li><p>A <a href="https://crates.io/crates/rust-research-mcp">Rust Research MCP server</a> that connects to multiple academic search systems including Semantic Scholar, OpenAlex, Crossref etc.</p></li></ul><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!_xCZ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F319c5e88-4722-4be9-b665-c0fab9729272_434x921.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!_xCZ!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F319c5e88-4722-4be9-b665-c0fab9729272_434x921.png 424w, 
https://substackcdn.com/image/fetch/$s_!_xCZ!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F319c5e88-4722-4be9-b665-c0fab9729272_434x921.png 848w, https://substackcdn.com/image/fetch/$s_!_xCZ!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F319c5e88-4722-4be9-b665-c0fab9729272_434x921.png 1272w, https://substackcdn.com/image/fetch/$s_!_xCZ!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F319c5e88-4722-4be9-b665-c0fab9729272_434x921.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!_xCZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F319c5e88-4722-4be9-b665-c0fab9729272_434x921.png" width="434" height="921" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/319c5e88-4722-4be9-b665-c0fab9729272_434x921.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:921,&quot;width&quot;:434,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!_xCZ!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F319c5e88-4722-4be9-b665-c0fab9729272_434x921.png 424w, 
https://substackcdn.com/image/fetch/$s_!_xCZ!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F319c5e88-4722-4be9-b665-c0fab9729272_434x921.png 848w, https://substackcdn.com/image/fetch/$s_!_xCZ!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F319c5e88-4722-4be9-b665-c0fab9729272_434x921.png 1272w, https://substackcdn.com/image/fetch/$s_!_xCZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F319c5e88-4722-4be9-b665-c0fab9729272_434x921.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><ul><li><p>A custom OpenAlex MCP server that I had Claude Opus 4.6 vibe-code using the OpenAlex API as an experiment.</p></li></ul><p>If you are not comfortable with Python or coding in general, the installation instructions for these servers may look intimidating. But you can use Claude Code itself and ask it to install these packages for you!</p><h2>The real advantage: combining tools through Skills</h2><p>The retrieval comparisons above are interesting, but they miss the more fundamental point. The real advantage of the MCP approach is not that it searches better &#8212; it is that it enables workflows that no single vendor anticipated.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!pvWP!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb5cb7d4-e90c-4e7a-8d2a-0634feb6aaa9_1316x723.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!pvWP!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb5cb7d4-e90c-4e7a-8d2a-0634feb6aaa9_1316x723.png 424w, https://substackcdn.com/image/fetch/$s_!pvWP!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb5cb7d4-e90c-4e7a-8d2a-0634feb6aaa9_1316x723.png 848w, https://substackcdn.com/image/fetch/$s_!pvWP!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb5cb7d4-e90c-4e7a-8d2a-0634feb6aaa9_1316x723.png 1272w, 
https://substackcdn.com/image/fetch/$s_!pvWP!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb5cb7d4-e90c-4e7a-8d2a-0634feb6aaa9_1316x723.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!pvWP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb5cb7d4-e90c-4e7a-8d2a-0634feb6aaa9_1316x723.png" width="1316" height="723" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/db5cb7d4-e90c-4e7a-8d2a-0634feb6aaa9_1316x723.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:723,&quot;width&quot;:1316,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1329177,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/188857498?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb5cb7d4-e90c-4e7a-8d2a-0634feb6aaa9_1316x723.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!pvWP!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb5cb7d4-e90c-4e7a-8d2a-0634feb6aaa9_1316x723.png 424w, https://substackcdn.com/image/fetch/$s_!pvWP!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb5cb7d4-e90c-4e7a-8d2a-0634feb6aaa9_1316x723.png 848w, 
https://substackcdn.com/image/fetch/$s_!pvWP!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb5cb7d4-e90c-4e7a-8d2a-0634feb6aaa9_1316x723.png 1272w, https://substackcdn.com/image/fetch/$s_!pvWP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb5cb7d4-e90c-4e7a-8d2a-0634feb6aaa9_1316x723.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>Here is a simple but concrete example: I asked Claude to search PubMed for papers on a topic, take the top 5 ranked results, 
and then use the Scite MCP server to retrieve mentioning and contrasting citations for each. </p><blockquote><p>See also <a href="https://aarontay.substack.com/p/how-agentic-are-academic-deep-research">my last blog post, with my test of &#8220;Find me papers that could/should have been cited by Paper &#8216;The state of OA: a large-scale analysis of the prevalence and impact of Open Access articles&#8217; but were not.&#8221;</a></p></blockquote><p>Claude successfully chained or &#8220;orchestrated&#8221; both tools together to produce exactly what I wanted<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-1" href="#footnote-1" target="_self">1</a>. </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Ac0m!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff5531432-09eb-4434-8d1d-17fb33a2e21b_719x779.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Ac0m!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff5531432-09eb-4434-8d1d-17fb33a2e21b_719x779.png 424w, https://substackcdn.com/image/fetch/$s_!Ac0m!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff5531432-09eb-4434-8d1d-17fb33a2e21b_719x779.png 848w, https://substackcdn.com/image/fetch/$s_!Ac0m!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff5531432-09eb-4434-8d1d-17fb33a2e21b_719x779.png 1272w, 
https://substackcdn.com/image/fetch/$s_!Ac0m!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff5531432-09eb-4434-8d1d-17fb33a2e21b_719x779.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Ac0m!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff5531432-09eb-4434-8d1d-17fb33a2e21b_719x779.png" width="719" height="779" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f5531432-09eb-4434-8d1d-17fb33a2e21b_719x779.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:779,&quot;width&quot;:719,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Ac0m!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff5531432-09eb-4434-8d1d-17fb33a2e21b_719x779.png 424w, https://substackcdn.com/image/fetch/$s_!Ac0m!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff5531432-09eb-4434-8d1d-17fb33a2e21b_719x779.png 848w, https://substackcdn.com/image/fetch/$s_!Ac0m!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff5531432-09eb-4434-8d1d-17fb33a2e21b_719x779.png 1272w, 
https://substackcdn.com/image/fetch/$s_!Ac0m!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff5531432-09eb-4434-8d1d-17fb33a2e21b_719x779.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!q4Qb!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F735a3db7-b64f-4d7a-ae97-50987afe64d2_748x713.png" data-component-name="Image2ToDOM"><div 
class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!q4Qb!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F735a3db7-b64f-4d7a-ae97-50987afe64d2_748x713.png 424w, https://substackcdn.com/image/fetch/$s_!q4Qb!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F735a3db7-b64f-4d7a-ae97-50987afe64d2_748x713.png 848w, https://substackcdn.com/image/fetch/$s_!q4Qb!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F735a3db7-b64f-4d7a-ae97-50987afe64d2_748x713.png 1272w, https://substackcdn.com/image/fetch/$s_!q4Qb!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F735a3db7-b64f-4d7a-ae97-50987afe64d2_748x713.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!q4Qb!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F735a3db7-b64f-4d7a-ae97-50987afe64d2_748x713.png" width="748" height="713" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/735a3db7-b64f-4d7a-ae97-50987afe64d2_748x713.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:713,&quot;width&quot;:748,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!q4Qb!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F735a3db7-b64f-4d7a-ae97-50987afe64d2_748x713.png 424w, https://substackcdn.com/image/fetch/$s_!q4Qb!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F735a3db7-b64f-4d7a-ae97-50987afe64d2_748x713.png 848w, https://substackcdn.com/image/fetch/$s_!q4Qb!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F735a3db7-b64f-4d7a-ae97-50987afe64d2_748x713.png 1272w, https://substackcdn.com/image/fetch/$s_!q4Qb!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F735a3db7-b64f-4d7a-ae97-50987afe64d2_748x713.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" 
stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This is a trivial example, but you can imagine more elaborate tasks where no single existing tool offers the specific workflow you want. With Claude+MCP, I did not need to wait for a vendor to build it.</p><p>This composability extends further through <a href="https://claude.com/skills">Claude Skills</a>, which are essentially predetermined prompts that Claude uses when triggered. </p><p>For example, you can define a &#8220;literature review&#8221; skill that searches multiple MCP servers (OpenAlex, Semantic Scholar, general web and your Zotero library), combines the results and writes a synthesis.</p><p>Skills are written in markdown and defined in natural language, so creating and modifying them requires no coding ability. 
Claude can even guide you through creating a skill by asking what you want it to do.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!eK_3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F88cab5e2-0396-4869-8dff-2948ac6d4965_1887x883.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!eK_3!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F88cab5e2-0396-4869-8dff-2948ac6d4965_1887x883.png 424w, https://substackcdn.com/image/fetch/$s_!eK_3!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F88cab5e2-0396-4869-8dff-2948ac6d4965_1887x883.png 848w, https://substackcdn.com/image/fetch/$s_!eK_3!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F88cab5e2-0396-4869-8dff-2948ac6d4965_1887x883.png 1272w, https://substackcdn.com/image/fetch/$s_!eK_3!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F88cab5e2-0396-4869-8dff-2948ac6d4965_1887x883.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!eK_3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F88cab5e2-0396-4869-8dff-2948ac6d4965_1887x883.png" width="1456" height="681" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/88cab5e2-0396-4869-8dff-2948ac6d4965_1887x883.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:681,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!eK_3!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F88cab5e2-0396-4869-8dff-2948ac6d4965_1887x883.png 424w, https://substackcdn.com/image/fetch/$s_!eK_3!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F88cab5e2-0396-4869-8dff-2948ac6d4965_1887x883.png 848w, https://substackcdn.com/image/fetch/$s_!eK_3!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F88cab5e2-0396-4869-8dff-2948ac6d4965_1887x883.png 1272w, https://substackcdn.com/image/fetch/$s_!eK_3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F88cab5e2-0396-4869-8dff-2948ac6d4965_1887x883.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The remaining steps should be self-explanatory.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Z0hK!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2beced6c-8472-4a7c-9cf8-d31e79932169_934x713.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Z0hK!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2beced6c-8472-4a7c-9cf8-d31e79932169_934x713.png 424w, https://substackcdn.com/image/fetch/$s_!Z0hK!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2beced6c-8472-4a7c-9cf8-d31e79932169_934x713.png 848w, 
https://substackcdn.com/image/fetch/$s_!Z0hK!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2beced6c-8472-4a7c-9cf8-d31e79932169_934x713.png 1272w, https://substackcdn.com/image/fetch/$s_!Z0hK!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2beced6c-8472-4a7c-9cf8-d31e79932169_934x713.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Z0hK!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2beced6c-8472-4a7c-9cf8-d31e79932169_934x713.png" width="934" height="713" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/2beced6c-8472-4a7c-9cf8-d31e79932169_934x713.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:713,&quot;width&quot;:934,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Z0hK!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2beced6c-8472-4a7c-9cf8-d31e79932169_934x713.png 424w, https://substackcdn.com/image/fetch/$s_!Z0hK!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2beced6c-8472-4a7c-9cf8-d31e79932169_934x713.png 848w, 
https://substackcdn.com/image/fetch/$s_!Z0hK!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2beced6c-8472-4a7c-9cf8-d31e79932169_934x713.png 1272w, https://substackcdn.com/image/fetch/$s_!Z0hK!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2beced6c-8472-4a7c-9cf8-d31e79932169_934x713.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>You could easily modify such a skill to only show results found by search that are not already in your Zotero library, or to create an 
entirely different search workflow. For a more advanced example, see <a href="https://www.linkedin.com/posts/alfredhwallace_better-ai-is-not-about-fetching-more-facts-activity-7420923355597561856-QjxR?utm_source=share&amp;utm_medium=member_desktop&amp;rcm=ACoAAADydNkB8cFBZ48tGuFjE4yHqQ6N6mBWEyE">Alfred Wallace&#8217;s skill design</a>, which is inspired by <a href="https://www.linkedin.com/feed/update/urn:li:activity:7419936708961472512/">work on guiding agentic retrievers on when to search broadly versus when to explore locally</a>. More advanced usage can involve adding resources and scripts for the skill to use.</p><p>The key insight is that everything is defined in natural language, so it is easy to change. The researcher defines the workflow, not the vendor.</p><h2>Limitations and open questions</h2><p>I&#8217;m only scratching the surface here. I&#8217;ve been hearing about the incredible workflows researchers and librarians are building by combining these tools. In essence, the process is now this simple:</p><ul><li><p>First: If you can access a source via API, you can &#8216;vibe code&#8217; an MCP server to talk to it.</p></li><li><p>Second: You create a skill in natural language to trigger that server and mash it up with anything else.</p></li><li><p>Third: There is no third step.</p></li></ul><p>In theory, you can set up a skill or flow to do:</p><ul><li><p>a Cochrane-type systematic review flow that involves coming up with inclusion criteria, searching and downloading from multiple sources, using the LLM to screen, etc.</p></li><li><p>searching for papers to do bibliometric analysis using a tool like <a href="https://github.com/Valdecy/pybibx">pybibx</a></p></li><li><p>comparison of the citations made to two different papers in the same area</p></li><li><p>some gap analysis, etc.</p></li></ul><p></p><p>The only academic-related platform that can match the capabilities of this setup is <a href="https://scispace.com/agents">SciSpace Agents</a>, which allows 
you to hook and connect a huge variety of premade tools. </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!vyQn!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7ab09f59-4183-4246-8612-3c9ff7f62ba3_564x722.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!vyQn!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7ab09f59-4183-4246-8612-3c9ff7f62ba3_564x722.png 424w, https://substackcdn.com/image/fetch/$s_!vyQn!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7ab09f59-4183-4246-8612-3c9ff7f62ba3_564x722.png 848w, https://substackcdn.com/image/fetch/$s_!vyQn!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7ab09f59-4183-4246-8612-3c9ff7f62ba3_564x722.png 1272w, https://substackcdn.com/image/fetch/$s_!vyQn!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7ab09f59-4183-4246-8612-3c9ff7f62ba3_564x722.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!vyQn!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7ab09f59-4183-4246-8612-3c9ff7f62ba3_564x722.png" width="564" height="722" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/7ab09f59-4183-4246-8612-3c9ff7f62ba3_564x722.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:722,&quot;width&quot;:564,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:52674,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/188857498?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7ab09f59-4183-4246-8612-3c9ff7f62ba3_564x722.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!vyQn!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7ab09f59-4183-4246-8612-3c9ff7f62ba3_564x722.png 424w, https://substackcdn.com/image/fetch/$s_!vyQn!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7ab09f59-4183-4246-8612-3c9ff7f62ba3_564x722.png 848w, https://substackcdn.com/image/fetch/$s_!vyQn!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7ab09f59-4183-4246-8612-3c9ff7f62ba3_564x722.png 1272w, https://substackcdn.com/image/fetch/$s_!vyQn!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7ab09f59-4183-4246-8612-3c9ff7f62ba3_564x722.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!CQ8n!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F44033c18-9c81-4a83-b508-0da1b66f53a0_982x972.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!CQ8n!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F44033c18-9c81-4a83-b508-0da1b66f53a0_982x972.png 424w, 
https://substackcdn.com/image/fetch/$s_!CQ8n!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F44033c18-9c81-4a83-b508-0da1b66f53a0_982x972.png 848w, https://substackcdn.com/image/fetch/$s_!CQ8n!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F44033c18-9c81-4a83-b508-0da1b66f53a0_982x972.png 1272w, https://substackcdn.com/image/fetch/$s_!CQ8n!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F44033c18-9c81-4a83-b508-0da1b66f53a0_982x972.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!CQ8n!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F44033c18-9c81-4a83-b508-0da1b66f53a0_982x972.png" width="982" height="972" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/44033c18-9c81-4a83-b508-0da1b66f53a0_982x972.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:972,&quot;width&quot;:982,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:137438,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/188857498?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F44033c18-9c81-4a83-b508-0da1b66f53a0_982x972.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!CQ8n!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F44033c18-9c81-4a83-b508-0da1b66f53a0_982x972.png 
424w, https://substackcdn.com/image/fetch/$s_!CQ8n!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F44033c18-9c81-4a83-b508-0da1b66f53a0_982x972.png 848w, https://substackcdn.com/image/fetch/$s_!CQ8n!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F44033c18-9c81-4a83-b508-0da1b66f53a0_982x972.png 1272w, https://substackcdn.com/image/fetch/$s_!CQ8n!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F44033c18-9c81-4a83-b508-0da1b66f53a0_982x972.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" 
y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>SciSpace Agents as an alternative is technically far less daunting to use but, as you might expect, it is costly.</p><p>Still, there are limitations.</p><h3><strong>The technical barrier</strong></h3><p>Setting up remote MCP servers is straightforward. Configuring local servers, vibe-coding custom ones, writing effective Skills, and ensuring secure operations require a level of technical comfort that most researchers and many librarians do not currently have. This is not a minor caveat &#8212; it is a significant barrier to adoption.</p><h3>Privacy and security</h3><p>I flagged this above, but it deserves emphasis. For researchers working on sensitive topics &#8212; anything from commercial R&amp;D to clinical research involving patient data &#8212; queries sent to remote MCP servers are visible to their operators. This is not a theoretical concern. Libraries routinely fight to protect patron privacy, and recommending MCP server setups without clearly communicating this risk would be irresponsible.</p><h3>Reproducibility and interpretability</h3><p>Every user&#8217;s MCP environment is different &#8212; different servers installed, different Skills configured, different model versions. If I run a literature search through my Claude Desktop setup and you run the same query through yours, we will likely get different results. </p><p>Ironically, the fixed workflows of specialised tools, which I criticised above for limiting flexibility, do at least provide a more consistent and documentable search process. There is a genuine tension here: the flexibility that makes the MCP approach powerful is the same property that makes it difficult to reproduce. 
Perhaps future practice would require submitting your entire Claude Code setup as part of a systematic review&#8217;s methodology, but we are far from established norms on this.</p><h3>Cost</h3><p>Claude Code and Claude Desktop with heavy tool use consume tokens rapidly. For a library or research group considering whether to invest in configuring MCP environments versus subscribing to Undermind or Consensus, the cost comparison matters. Specialised tools offer flat-rate subscriptions with predictable costs; the MCP approach scales with usage in ways that can be difficult to forecast.</p><p>However, with techniques like clever use of <a href="https://claude.com/skills">Claude Skills</a> to load only necessary context instead of all MCP servers, <a href="https://platform.claude.com/docs/en/build-with-claude/compaction">server-side context compaction for managing long conversations that approach context window limits</a>, and <a href="https://www.anthropic.com/engineering/code-execution-with-mcp">code execution where LLMs write code to call tools instead of direct tool calls</a>, this problem may be reduced.</p><p></p><h2>Implications for libraries</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!rePO!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdaba55b7-78e0-4759-bc0f-c723bac0632e_1203x670.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!rePO!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdaba55b7-78e0-4759-bc0f-c723bac0632e_1203x670.png 424w, 
https://substackcdn.com/image/fetch/$s_!rePO!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdaba55b7-78e0-4759-bc0f-c723bac0632e_1203x670.png 848w, https://substackcdn.com/image/fetch/$s_!rePO!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdaba55b7-78e0-4759-bc0f-c723bac0632e_1203x670.png 1272w, https://substackcdn.com/image/fetch/$s_!rePO!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdaba55b7-78e0-4759-bc0f-c723bac0632e_1203x670.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!rePO!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdaba55b7-78e0-4759-bc0f-c723bac0632e_1203x670.png" width="1203" height="670" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/daba55b7-78e0-4759-bc0f-c723bac0632e_1203x670.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:670,&quot;width&quot;:1203,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:988112,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/188857498?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdaba55b7-78e0-4759-bc0f-c723bac0632e_1203x670.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!rePO!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdaba55b7-78e0-4759-bc0f-c723bac0632e_1203x670.png 424w, https://substackcdn.com/image/fetch/$s_!rePO!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdaba55b7-78e0-4759-bc0f-c723bac0632e_1203x670.png 848w, https://substackcdn.com/image/fetch/$s_!rePO!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdaba55b7-78e0-4759-bc0f-c723bac0632e_1203x670.png 1272w, https://substackcdn.com/image/fetch/$s_!rePO!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdaba55b7-78e0-4759-bc0f-c723bac0632e_1203x670.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" 
stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>Despite these limitations, the direction of travel seems clear, and it has significant implications for libraries.</p><p><a href="https://www.linkedin.com/posts/activity-7420125483293548544-J1yr/?utm_source=share&amp;utm_medium=member_desktop&amp;rcm=ACoAAADydNkB8cFBZ48tGuFjE4yHqQ6N6mBWEyE">Alfred Wallace, a librarian who is perhaps a leader in exploring what is possible with MCP in research contexts, has been experimenting with building comprehensive research agent setups</a>.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!qZJa!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc981572c-9cfb-4459-bb3e-96ea075fcb87_638x674.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!qZJa!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc981572c-9cfb-4459-bb3e-96ea075fcb87_638x674.png 424w, https://substackcdn.com/image/fetch/$s_!qZJa!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc981572c-9cfb-4459-bb3e-96ea075fcb87_638x674.png 848w, https://substackcdn.com/image/fetch/$s_!qZJa!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc981572c-9cfb-4459-bb3e-96ea075fcb87_638x674.png 1272w, 
https://substackcdn.com/image/fetch/$s_!qZJa!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc981572c-9cfb-4459-bb3e-96ea075fcb87_638x674.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!qZJa!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc981572c-9cfb-4459-bb3e-96ea075fcb87_638x674.png" width="638" height="674" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c981572c-9cfb-4459-bb3e-96ea075fcb87_638x674.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:674,&quot;width&quot;:638,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!qZJa!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc981572c-9cfb-4459-bb3e-96ea075fcb87_638x674.png 424w, https://substackcdn.com/image/fetch/$s_!qZJa!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc981572c-9cfb-4459-bb3e-96ea075fcb87_638x674.png 848w, https://substackcdn.com/image/fetch/$s_!qZJa!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc981572c-9cfb-4459-bb3e-96ea075fcb87_638x674.png 1272w, 
https://substackcdn.com/image/fetch/$s_!qZJa!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc981572c-9cfb-4459-bb3e-96ea075fcb87_638x674.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><a href="https://www.linkedin.com/posts/alfredhwallace_claude-activity-7421986340428472320-sUAE?utm_source=share&amp;utm_medium=member_desktop&amp;rcm=ACoAAADydNkB8cFBZ48tGuFjE4yHqQ6N6mBWEyE">He has raised the provocative idea of &#8220;AI tool fine-tuning as a service&#8221; from libraries. 
</a>The concept is that librarians, with their understanding of information retrieval principles and research methodology, are well-positioned to configure these environments for researchers &#8212; selecting appropriate MCP servers, writing effective Skills, and advising on the limitations of different configurations.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Yvah!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11591c6e-f642-48ea-9351-7233853be820_493x311.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Yvah!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11591c6e-f642-48ea-9351-7233853be820_493x311.png 424w, https://substackcdn.com/image/fetch/$s_!Yvah!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11591c6e-f642-48ea-9351-7233853be820_493x311.png 848w, https://substackcdn.com/image/fetch/$s_!Yvah!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11591c6e-f642-48ea-9351-7233853be820_493x311.png 1272w, https://substackcdn.com/image/fetch/$s_!Yvah!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11591c6e-f642-48ea-9351-7233853be820_493x311.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Yvah!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11591c6e-f642-48ea-9351-7233853be820_493x311.png" width="493" height="311" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/11591c6e-f642-48ea-9351-7233853be820_493x311.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:311,&quot;width&quot;:493,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Yvah!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11591c6e-f642-48ea-9351-7233853be820_493x311.png 424w, https://substackcdn.com/image/fetch/$s_!Yvah!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11591c6e-f642-48ea-9351-7233853be820_493x311.png 848w, https://substackcdn.com/image/fetch/$s_!Yvah!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11591c6e-f642-48ea-9351-7233853be820_493x311.png 1272w, https://substackcdn.com/image/fetch/$s_!Yvah!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F11591c6e-f642-48ea-9351-7233853be820_493x311.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>In particular, he asks very deep and insightful questions about the setting up, <strong>maintenance</strong> and control of MCP servers.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!wUqU!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6a5fd592-c94b-463a-b59c-cf73199ba38f_464x738.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!wUqU!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6a5fd592-c94b-463a-b59c-cf73199ba38f_464x738.png 424w, https://substackcdn.com/image/fetch/$s_!wUqU!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6a5fd592-c94b-463a-b59c-cf73199ba38f_464x738.png 848w, 
https://substackcdn.com/image/fetch/$s_!wUqU!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6a5fd592-c94b-463a-b59c-cf73199ba38f_464x738.png 1272w, https://substackcdn.com/image/fetch/$s_!wUqU!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6a5fd592-c94b-463a-b59c-cf73199ba38f_464x738.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!wUqU!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6a5fd592-c94b-463a-b59c-cf73199ba38f_464x738.png" width="464" height="738" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/6a5fd592-c94b-463a-b59c-cf73199ba38f_464x738.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:738,&quot;width&quot;:464,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!wUqU!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6a5fd592-c94b-463a-b59c-cf73199ba38f_464x738.png 424w, https://substackcdn.com/image/fetch/$s_!wUqU!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6a5fd592-c94b-463a-b59c-cf73199ba38f_464x738.png 848w, 
https://substackcdn.com/image/fetch/$s_!wUqU!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6a5fd592-c94b-463a-b59c-cf73199ba38f_464x738.png 1272w, https://substackcdn.com/image/fetch/$s_!wUqU!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6a5fd592-c94b-463a-b59c-cf73199ba38f_464x738.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>There is also institutional-level activity worth watching. 
Clarivate's Nexus project, while easy to dismiss as merely a browser extension comparable to LibKey Nomad or Lean Library, appears to be a more ambitious play. </p><p>Their vision seems to be for Nexus to serve as an aggregation point for library-related MCP servers, not just Clarivate's own. For example, <a href="https://www.youtube.com/watch?v=SgFsxlCQvOE&amp;t=850s">Springshare's LibGuides was mentioned at CNI as an example of other vendor MCPs that could be integrated</a>. </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!me1q!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5548f0e1-afe5-4c37-afb2-4e5b555eba14_1325x602.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!me1q!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5548f0e1-afe5-4c37-afb2-4e5b555eba14_1325x602.png 424w, https://substackcdn.com/image/fetch/$s_!me1q!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5548f0e1-afe5-4c37-afb2-4e5b555eba14_1325x602.png 848w, https://substackcdn.com/image/fetch/$s_!me1q!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5548f0e1-afe5-4c37-afb2-4e5b555eba14_1325x602.png 1272w, https://substackcdn.com/image/fetch/$s_!me1q!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5548f0e1-afe5-4c37-afb2-4e5b555eba14_1325x602.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!me1q!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5548f0e1-afe5-4c37-afb2-4e5b555eba14_1325x602.png" width="1325" height="602" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/5548f0e1-afe5-4c37-afb2-4e5b555eba14_1325x602.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:602,&quot;width&quot;:1325,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!me1q!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5548f0e1-afe5-4c37-afb2-4e5b555eba14_1325x602.png 424w, https://substackcdn.com/image/fetch/$s_!me1q!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5548f0e1-afe5-4c37-afb2-4e5b555eba14_1325x602.png 848w, https://substackcdn.com/image/fetch/$s_!me1q!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5548f0e1-afe5-4c37-afb2-4e5b555eba14_1325x602.png 1272w, https://substackcdn.com/image/fetch/$s_!me1q!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5548f0e1-afe5-4c37-afb2-4e5b555eba14_1325x602.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft 
icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This is a clever and strategic role that Clarivate wants to play, as an intermediary/gatekeeper, though it&#8217;s unclear if other vendors would allow such a move. This could also compete with a model where libraries assemble their own bundles of Skills and MCP servers. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!t_zd!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F79884a5a-48c3-49a2-9963-1bc75443040d_1202x672.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!t_zd!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F79884a5a-48c3-49a2-9963-1bc75443040d_1202x672.png 424w, https://substackcdn.com/image/fetch/$s_!t_zd!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F79884a5a-48c3-49a2-9963-1bc75443040d_1202x672.png 848w, https://substackcdn.com/image/fetch/$s_!t_zd!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F79884a5a-48c3-49a2-9963-1bc75443040d_1202x672.png 1272w, https://substackcdn.com/image/fetch/$s_!t_zd!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F79884a5a-48c3-49a2-9963-1bc75443040d_1202x672.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!t_zd!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F79884a5a-48c3-49a2-9963-1bc75443040d_1202x672.png" width="1202" height="672" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/79884a5a-48c3-49a2-9963-1bc75443040d_1202x672.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:672,&quot;width&quot;:1202,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1098047,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/188857498?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F79884a5a-48c3-49a2-9963-1bc75443040d_1202x672.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!t_zd!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F79884a5a-48c3-49a2-9963-1bc75443040d_1202x672.png 424w, https://substackcdn.com/image/fetch/$s_!t_zd!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F79884a5a-48c3-49a2-9963-1bc75443040d_1202x672.png 848w, https://substackcdn.com/image/fetch/$s_!t_zd!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F79884a5a-48c3-49a2-9963-1bc75443040d_1202x672.png 1272w, https://substackcdn.com/image/fetch/$s_!t_zd!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F79884a5a-48c3-49a2-9963-1bc75443040d_1202x672.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>The question of full-text access also deserves attention. <a href="https://www.linkedin.com/posts/activity-7424160043664719872-AI8y/?utm_source=social_share_send&amp;utm_medium=android_app&amp;rcm=ACoAAADydNkB8cFBZ48tGuFjE4yHqQ6N6mBWEyE&amp;utm_campaign=copy_link">Alfred suggests a simple approach: configure the LLM's instructions to prepend a LibKey prefix to any DOI it retrieves, so that links eventually resolve through the library's access infrastructure.</a> This works reasonably well, with one notable issue: LibKey does not handle non-Crossref DOIs, and the most common non-Crossref DOIs tend to be arXiv papers (which use DataCite DOIs) that are freely accessible anyway. This can confuse users. 
You can prompt the LLM to handle these exceptions, but it consumes tokens for marginal benefit.</p><p>Better solutions might start to emerge: for example, LibKey itself is reportedly launching an MCP server, and <a href="https://www.getfulltextresearch.com/getftr-enables-ai-tools-to-check-access-rights-for-academic-content">protocols like GetFTR have been positioning themselves as a way for AI agents to access full text through their own MCP servers.</a></p><p>The issue here, I suspect, isn&#8217;t technology but business model and usage tracking. Since the rise of ChatGPT, <a href="https://scholarlykitchen.sspnet.org/2026/02/12/guest-post-theres-an-elephant-in-the-room-but-not-in-your-usage-reports/">publishers have been worried about what is now called &#8220;zero-click search&#8221; leading to &#8220;zero-click results&#8221;.</a> Will they really allow agentic LLMs to so easily consume full text?</p><h2>Where this is heading</h2><p>The general trajectory of frontier LLMs is towards increasingly capable agentic search behaviour. <a href="https://openai.com/index/browsecomp/">BrowseComp, the most well-known benchmark for agentic web search</a>, has seen top models (Claude and Gemini) improve from barely over 50% in April 2025 to over 80%<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-2" href="#footnote-2" target="_self">2</a> now, in less than a year. </p><p>OpenAI has tried building app ecosystems multiple times &#8212; <a href="https://openai.com/index/chatgpt-plugins/">ChatGPT plugins in 2023</a>, <a href="https://openai.com/index/introducing-gpts/">CustomGPTs</a>, and <a href="https://openai.com/index/introducing-apps-in-chatgpt/">now apps</a> &#8212; and the first two attempts largely gained little traction. 
The difference this time is that MCP is not an OpenAI-specific implementation but an open standard supported across all three major AI labs.</p><p>For academic search specifically, I think the practical recommendation is clear: use both specialised tools and general LLMs with academic MCP connections. The specialised tools offer structured workflows and purpose-built features for specific research tasks. The general LLMs with MCP offer flexibility, broader content coverage, and the ability to create custom workflows. They complement rather than replace each other.</p><p>The deeper question &#8212; whether the future of research tooling lies in polished, vendor-defined products or in researcher-configured composable environments &#8212; remains open. My sense is that we are heading towards a middle ground: vendor tools that expose MCP interfaces, allowing them to be composed in ways the vendors did not anticipate, combined with institutional configurations (possibly maintained by libraries) that provide sensible defaults while remaining customisable<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-3" href="#footnote-3" target="_self">3</a>. </p><p>But that is speculation, and the landscape is moving fast enough that confident predictions seem unwise.</p><div class="captioned-button-wrap" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/creating-your-own-research-assistant?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="CaptionedButtonToDOM"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! 
This post is public so feel free to share it.</p></div><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/creating-your-own-research-assistant?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://aarontay.substack.com/p/creating-your-own-research-assistant?utm_source=substack&utm_medium=email&utm_content=share&action=share"><span>Share</span></a></p></div><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me Coffee (via ko-fi)&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me Coffee (via ko-fi)</span></a></p><p></p><p></p><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-1" href="#footnote-anchor-1" class="footnote-number" contenteditable="false" target="_self">1</a><div class="footnote-content"><p>Orchestration of agents can get very complicated, in Claude Code, <a href="https://code.claude.com/docs/en/agent-teams">there is a distinction between &#8220;subagents&#8221; and &#8220;agent teams&#8221;</a> where <a href="https://code.claude.com/docs/en/agent-teams">&#8220;Subagents only report results back to the main agent and never talk to each other. 
In agent teams, teammates share a task list, claim work, and communicate directly with each other.&#8221;</a></p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-2" href="#footnote-anchor-2" class="footnote-number" contenteditable="false" target="_self">2</a><div class="footnote-content"><p><a href="https://deepmind.google/models/model-cards/gemini-3-1-pro/">As of Feb 2026, Gemini 3.1 Pro (85.9%), Opus 4.6 (84.0%), GPT5.2 (xhigh) (65.8%)</a></p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-3" href="#footnote-anchor-3" class="footnote-number" contenteditable="false" target="_self">3</a><div class="footnote-content"><p>For example, I just noticed that while Undermind doesn&#8217;t offer an MCP server, they do offer APIs which are incorporated into Enterprise &#8220;AI Scientist&#8221; systems. <a href="https://www.undermind.ai/case-studies/gsk">See this case study.</a> A few days after I wrote this, <a href="https://elicit.com/blog/elicit-api">Elicit.com, a leading academic AI search tool, also launched their API, saying &#8220;Integrate Elicit into your workflow. Call the API from Claude or ChatGPT to get real citations while writing a paper&#8230;&#8221;</a></p></div></div>]]></content:encoded></item><item><title><![CDATA[Are AI Tools Killing Review Articles? Two Failure Modes Suggest Otherwise ]]></title><description><![CDATA[arXiv recently restricted review article submissions in computer science, requiring journal or conference acceptance before deposit. 
They noted specifically that the change was driven by an &#8220;unmanageable influx&#8221; and that LLMs made review/position papers &#8220;fast and easy to write,&#8221; and that many were &#8220;little more than annotated bibliographies.&#8221;]]></description><link>https://aarontay.substack.com/p/are-ai-tools-killing-review-articles</link><guid isPermaLink="false">https://aarontay.substack.com/p/are-ai-tools-killing-review-articles</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Thu, 12 Feb 2026 19:24:16 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!nhEY!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3010ca9b-a69d-4b88-a443-86ee5e7ee9a1_1024x559.jpeg" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!nhEY!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3010ca9b-a69d-4b88-a443-86ee5e7ee9a1_1024x559.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!nhEY!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3010ca9b-a69d-4b88-a443-86ee5e7ee9a1_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!nhEY!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3010ca9b-a69d-4b88-a443-86ee5e7ee9a1_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!nhEY!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3010ca9b-a69d-4b88-a443-86ee5e7ee9a1_1024x559.jpeg 1272w, 
https://substackcdn.com/image/fetch/$s_!nhEY!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3010ca9b-a69d-4b88-a443-86ee5e7ee9a1_1024x559.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!nhEY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3010ca9b-a69d-4b88-a443-86ee5e7ee9a1_1024x559.jpeg" width="1024" height="559" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/3010ca9b-a69d-4b88-a443-86ee5e7ee9a1_1024x559.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:181895,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/187309602?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3010ca9b-a69d-4b88-a443-86ee5e7ee9a1_1024x559.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!nhEY!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3010ca9b-a69d-4b88-a443-86ee5e7ee9a1_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!nhEY!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3010ca9b-a69d-4b88-a443-86ee5e7ee9a1_1024x559.jpeg 848w, 
https://substackcdn.com/image/fetch/$s_!nhEY!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3010ca9b-a69d-4b88-a443-86ee5e7ee9a1_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!nhEY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3010ca9b-a69d-4b88-a443-86ee5e7ee9a1_1024x559.jpeg 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p><a 
href="https://blog.arxiv.org/2025/10/31/attention-authors-updated-practice-for-review-articles-and-position-papers-in-arxiv-cs-category/">arXiv recently restricted review article submissions in computer science, requiring journal or conference acceptance before deposit</a>. They noted specifically that the change was driven by an &#8220;unmanageable influx&#8221; and that LLMs made review/position papers &#8220;fast and easy to write,&#8221; and that many were &#8220;little more than annotated bibliographies.&#8221;</p><p><a href="https://blog.arxiv.org/2026/01/21/attention-authors-updated-endorsement-policy/">Separately, arXiv has also tightened its author endorsement policy</a>.</p><p>It&#8217;s hard not to see the shared pressure behind both: scholarly infrastructure is facing a surge of low-quality, high-volume submissions, and AI has made certain genres&#8212;especially &#8220;survey-like&#8221; writing&#8212;cheap to produce.</p><p>So: are we witnessing the death of the review article?</p><p><a href="https://doi.org/10.1002/leap.1648">Galli et al. (2024)</a>, writing in Learned Publishing, argue &#8220;no&#8221; with a useful distinction. They separate descriptive reviews (primarily summarising and aggregating) from reflexive reviews (interpretation, theorisation, agenda-setting). Their claim is that AI will commoditise descriptive reviews, while reflexive reviews, those requiring &#8220;human imagination, creativity and abstraction&#8221;, will retain value.</p><p>That framing is plausible. 
But I think it underestimates something important: even &#8220;mere&#8221; descriptive reviews are hard to do well, because they depend on two upstream bottlenecks that today&#8217;s AI literature tools have not yet fully solved.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me Coffee via ko-fi&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me Coffee via ko-fi</span></a></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!VQn_!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00006d2d-e51a-4c3e-8d42-4e5249547b63_2752x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!VQn_!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00006d2d-e51a-4c3e-8d42-4e5249547b63_2752x1536.png 424w, https://substackcdn.com/image/fetch/$s_!VQn_!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00006d2d-e51a-4c3e-8d42-4e5249547b63_2752x1536.png 848w, https://substackcdn.com/image/fetch/$s_!VQn_!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00006d2d-e51a-4c3e-8d42-4e5249547b63_2752x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!VQn_!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00006d2d-e51a-4c3e-8d42-4e5249547b63_2752x1536.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!VQn_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00006d2d-e51a-4c3e-8d42-4e5249547b63_2752x1536.png" width="1456" height="813" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/00006d2d-e51a-4c3e-8d42-4e5249547b63_2752x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:813,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:6077114,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/187309602?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00006d2d-e51a-4c3e-8d42-4e5249547b63_2752x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!VQn_!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00006d2d-e51a-4c3e-8d42-4e5249547b63_2752x1536.png 424w, https://substackcdn.com/image/fetch/$s_!VQn_!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00006d2d-e51a-4c3e-8d42-4e5249547b63_2752x1536.png 848w, https://substackcdn.com/image/fetch/$s_!VQn_!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00006d2d-e51a-4c3e-8d42-4e5249547b63_2752x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!VQn_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00006d2d-e51a-4c3e-8d42-4e5249547b63_2752x1536.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><h2><strong>Failure Mode 1: The corpus construction gap (retrieval and exhaustiveness)</strong></h2><p>Can these tools actually find ALL the relevant papers with clear criteria?</p><p>At SMU Libraries, we&#8217;ve been early institutional subscribers to <a href="http://undermind.ai">Undermind </a>(since 2024). 
It&#8217;s among the earliest and strongest off-the-shelf &#8220;deep research&#8221; tools we&#8217;ve seen, and it&#8217;s heavily used and genuinely appreciated by faculty and PhD students.</p><p>But when we test it against published systematic review corpora, using the SR&#8217;s included-studies list as a &#8220;gold standard&#8221; target set, Undermind retrieves only <strong>~30&#8211;80%</strong> of those target papers after running for around 8 minutes.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!zZRh!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc2ff609c-5caa-4758-a171-7b3daa9b77ae_1024x559.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!zZRh!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc2ff609c-5caa-4758-a171-7b3daa9b77ae_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!zZRh!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc2ff609c-5caa-4758-a171-7b3daa9b77ae_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!zZRh!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc2ff609c-5caa-4758-a171-7b3daa9b77ae_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!zZRh!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc2ff609c-5caa-4758-a171-7b3daa9b77ae_1024x559.jpeg 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!zZRh!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc2ff609c-5caa-4758-a171-7b3daa9b77ae_1024x559.jpeg" width="1024" height="559" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c2ff609c-5caa-4758-a171-7b3daa9b77ae_1024x559.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:137207,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/187309602?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc2ff609c-5caa-4758-a171-7b3daa9b77ae_1024x559.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!zZRh!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc2ff609c-5caa-4758-a171-7b3daa9b77ae_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!zZRh!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc2ff609c-5caa-4758-a171-7b3daa9b77ae_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!zZRh!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc2ff609c-5caa-4758-a171-7b3daa9b77ae_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!zZRh!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc2ff609c-5caa-4758-a171-7b3daa9b77ae_1024x559.jpeg 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Systematic reviews we benchmark against are often narrow, with clear inclusion/exclusion criteria and established terminology. If these are &#8220;easy mode,&#8221; why does retrieval still fall short?</p><p>A big part of the answer I believe is architectural and product-driven. 
Tools like <a href="http://undermind.ai">Undermind</a>, <a href="http://elicit.com">Elicit</a><a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-1" href="#footnote-1" target="_self">1</a>, and <a href="http://consensus.app">Consensus</a> tend to be tuned for high precision and &#8220;reasonable recall,&#8221; not exhaustive coverage. They&#8217;re designed to help a researcher get to a useful working set quickly&#8212;not to support Cochrane/JBI/Campbell-style comprehensiveness.</p><p>This aligns with what others (mostly evidence synthesis practitioners) said in response to my <a href="https://www.linkedin.com/feed/update/urn:li:activity:7425616028627283968/">LinkedIn post</a> (which this post is built on). <a href="https://www.linkedin.com/in/jfrechette/">John Frechette </a>articulated this: &#8220;When it comes to retrieving hundreds or thousands of papers on a topic, current tools aren&#8217;t really set up for it.&#8221; <a href="https://www.linkedin.com/in/howard-white-0bb20a21/?originalSubdomain=de">Howard White</a> agreed: &#8220;Finding papers is a weak point.&#8221;</p><p>And this matters because the descriptive/reflexive distinction quietly assumes access to a representative corpus. If your corpus is incomplete in systematic ways, your synthesis (descriptive or reflexive) inherits those blind spots.</p><p>To be clear: for many purposes, &#8220;good enough&#8221; retrieval is good enough. Tools that can cite (almost all) seminal works, surface major strands, and produce coherent overviews in a short amount of time can absolutely save a ton of time when producing reviews.</p><p>But for methods where exhaustive recall is the point, current tools are still unreliable. 
The obvious fix is &#8220;throw more compute at it.&#8221; But while more time and more queries help, so does addressing less glamorous issues: corpus coverage (including paywalled content), indexing scope, metadata quality, transparent search strategy control, deduplication, and screening workflows.</p><p>Even so, if I had to bet, I&#8217;d say this first gap is the more solvable one. For example, given that as of now <a href="https://metr.org/">METR shows a 50% chance of completing a task of over 6 hours</a>, a tool designed just for systematic reviews might be able to close the gap.</p><p>The harder gap is the next issue.</p><h2><strong>Failure Mode 2: The conceptualisation gap (expert judgement starts before retrieval)</strong></h2><p>The reflexive review problem isn&#8217;t only about clever synthesis after you&#8217;ve gathered the papers. It often starts earlier.</p><p><strong>You need expert judgement to find the papers in the first place.</strong></p><p>Over the 1.5 years of our institutional subscription to Undermind, I have made it a point to ask the few disappointed users why they don&#8217;t like the tool and to collect failed Undermind queries from them. </p><p>The failed queries cluster in a very recognizable pattern: broad, often cross-disciplinary questions that require interpretive leaps&#8212;connecting subdomains that don&#8217;t share vocabulary, or asking for relationships that haven&#8217;t been named explicitly in the literature.</p><p>Users report that the tools interpret queries <em>narrowly</em> and conservatively. They stay close to established terminology and mainstream frameworks. 
They struggle to &#8220;bridge&#8221; conceptual gaps&#8212;especially when the question is exploratory (&#8220;what research exists?&#8221;) rather than confirmatory (&#8220;what does this well-defined literature say?&#8221;)<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-2" href="#footnote-2" target="_self">2</a>.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!gVIY!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F83c10215-e26f-42d1-a769-08d81b6e5cae_1024x559.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!gVIY!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F83c10215-e26f-42d1-a769-08d81b6e5cae_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!gVIY!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F83c10215-e26f-42d1-a769-08d81b6e5cae_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!gVIY!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F83c10215-e26f-42d1-a769-08d81b6e5cae_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!gVIY!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F83c10215-e26f-42d1-a769-08d81b6e5cae_1024x559.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!gVIY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F83c10215-e26f-42d1-a769-08d81b6e5cae_1024x559.jpeg" width="1024" height="559" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/83c10215-e26f-42d1-a769-08d81b6e5cae_1024x559.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:85701,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/187309602?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F83c10215-e26f-42d1-a769-08d81b6e5cae_1024x559.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!gVIY!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F83c10215-e26f-42d1-a769-08d81b6e5cae_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!gVIY!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F83c10215-e26f-42d1-a769-08d81b6e5cae_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!gVIY!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F83c10215-e26f-42d1-a769-08d81b6e5cae_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!gVIY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F83c10215-e26f-42d1-a769-08d81b6e5cae_1024x559.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This shouldn&#8217;t be unexpected. These systems are trained to reflect patterns in existing literature, not to make bold interpretative moves. 
They&#8217;re designed to reproduce consensus: great at aggregating what a field already recognises, weaker at proposing new framings or deliberately hunting for minority subdomains and boundary cases.</p><p><a href="https://scholar.google.com/citations?user=zABCBMMAAAAJ&amp;hl=en">Neal Haddaway</a>, another expert in evidence synthesis, makes a closely related observation from the evidence-synthesis world: in broad evidence maps&#8212;where the question is essentially &#8220;what research exists?&#8221;&#8212;AI tends to miss important minority subdomains, not because it can&#8217;t describe them, but because it can&#8217;t systematically search across diverse topics without collapsing toward the dominant cluster.</p><blockquote><p>&#8220;&#8230; my experience has been that AI fails for broad evidence maps where the question is &#8220;what research exists&#8221;, not because AI can&#8217;t describe those concepts, but because it can&#8217;t systematically search for diverse topics, and tends towards aggregation, missing important minority subdomains.&#8221;</p></blockquote><p>The <a href="https://www.nature.com/articles/s41586-025-10072-4">OpenScholar paper (Asai et al., 2025) is interesting too</a>. Nature headlined that experts preferred OpenScholar&#8217;s outputs 51&#8211;70% of the time over PhD-written answers. But what did it excel at? &#8220;Comprehensive coverage, organisation, breadth of sources&#8221;&#8212;classic descriptive synthesis. That&#8217;s impressive, and genuinely useful. But it doesn&#8217;t magically solve the deeper issue: will the system make the right conceptual jumps, notice what&#8217;s missing, and generate non-obvious observations that advance the field?</p><p>Even if you patiently iterate&#8212;rephrase, expand, steer&#8212;today&#8217;s tools still tend to reproduce the existing shape of the literature rather than challenge it. 
And for reflexive, field-shaping work, that&#8217;s the whole game.</p><p>It is important to note that most AI literature review tools are using the equivalent of 20 USD Tier models. There are hints that the <a href="https://deepmind.google/blog/accelerating-mathematical-and-scientific-discovery-with-gemini-deep-think/">200 USD Tier models such as ChatGPT PRO/Gemini DeepThink models can surpass these limits and come up with truly original scientific insights</a>, but we will see in the future when their costs drop enough to be used for off-the-shelf AI literature review tools.</p><h2>Conclusion</h2><p>Review articles&#8212;descriptive included&#8212;won&#8217;t die as long as incentives persist and, as librarian Alex Carroll points out, reviews are cited at higher rates than primary research. More importantly, for graduate students, writing a review chapter has long been a pedagogical exercise: you write to build the conceptual scaffolding that lets you do original research.</p><p>The question is not merely:</p><blockquote><p>&#8220;Can AI write competent reviews?&#8221;</p></blockquote><p>It&#8217;s:</p><blockquote><p>&#8220;What happens to researcher development if AI does the cognitive work that reviews were historically <em>for</em>?&#8221;</p></blockquote><p>A well-written review becomes Chapter 1 of a dissertation because writing it forces the author to wrestle with definitions, boundaries, tensions, and absences&#8212;exactly the things that later shape novel contributions. If we offload that struggle too early, we may get more polished text and fewer well-formed thinkers.</p><p>So yes: increasingly, AI makes descriptive review prose cheap. But judgement&#8212;what to include, how to frame, what&#8217;s missing, what matters&#8212;remains scarce. 
And in many disciplines, the only reliable way people learn to produce that judgement is still the slow, slightly painful process of doing the review themselves.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee via ko-fi&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee via ko-fi</span></a></p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p><em>An earlier version of this argument appeared as a <a href="https://www.linkedin.com/feed/update/urn:li:activity:7425616028627283968/">LinkedIn post</a>, and this post benefited a lot from reader comments and pushback.</em></p><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-1" href="#footnote-anchor-1" class="footnote-number" contenteditable="false" target="_self">1</a><div class="footnote-content"><p>Of these, only Elicit has pivoted to focusing on systematic review. 
Elicit just reported an 85% recall rate using cutting-edge Opus 4.6 as of Feb 2026.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-2" href="#footnote-anchor-2" class="footnote-number" contenteditable="false" target="_self">2</a><div class="footnote-content"><p>This is an example of a (lightly altered) query that Undermind struggles with for many reasons (e.g. Humanities, lack of monograph coverage, extremely broad, with an additional difficulty asking how works are cited): <em>I want to find a few articles, books, or chapters in the subfield of science and technology studies&#8212;published since 2000&#8212;that cite Bruno Latour&#8217;s Reassembling the Social specifically for his concepts of actor-network theory, translation, or non-human agency (across any substantive domain), and provide a basic description of how Latour is cited in each. </em></p></div></div>]]></content:encoded></item><item><title><![CDATA[The Sycophancy Fallacy: Why You May be Worried About the Wrong Bias with Search]]></title><description><![CDATA[AI search tools aren't "agreeing" with users&#8212;they are retrieval systems. 
Confusing the two is a category error that obscures the real risks.]]></description><link>https://aarontay.substack.com/p/the-sycophancy-fallacy-why-you-may</link><guid isPermaLink="false">https://aarontay.substack.com/p/the-sycophancy-fallacy-why-you-may</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Sat, 31 Jan 2026 20:45:27 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!66gC!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68271e4b-df46-4f8b-b4db-367e914f200d_1024x559.jpeg" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!66gC!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68271e4b-df46-4f8b-b4db-367e914f200d_1024x559.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!66gC!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68271e4b-df46-4f8b-b4db-367e914f200d_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!66gC!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68271e4b-df46-4f8b-b4db-367e914f200d_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!66gC!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68271e4b-df46-4f8b-b4db-367e914f200d_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!66gC!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68271e4b-df46-4f8b-b4db-367e914f200d_1024x559.jpeg 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!66gC!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68271e4b-df46-4f8b-b4db-367e914f200d_1024x559.jpeg" width="1024" height="559" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/68271e4b-df46-4f8b-b4db-367e914f200d_1024x559.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:169605,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/186338478?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68271e4b-df46-4f8b-b4db-367e914f200d_1024x559.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!66gC!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68271e4b-df46-4f8b-b4db-367e914f200d_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!66gC!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68271e4b-df46-4f8b-b4db-367e914f200d_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!66gC!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68271e4b-df46-4f8b-b4db-367e914f200d_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!66gC!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68271e4b-df46-4f8b-b4db-367e914f200d_1024x559.jpeg 1456w" 
sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>I&#8217;ve had a post titled &#8220;Common Misconceptions Librarians Have About Information Retrieval&#8221; sitting in my drafts for months. 
I never published it because some points felt like trivial nitpicking (lexical search doesn&#8217;t have to be Boolean; overly narrow definitions of &#8220;neural search&#8221;), and others were eventually covered elsewhere.</p><p>But recently I&#8217;ve encountered two related ideas that concern me more, because they&#8217;re seductive and contain just enough truth to seem plausible&#8212;while obscuring where the genuine problems actually lie.</p><p>I&#8217;m not naming sources&#8212;this isn&#8217;t about embarrassing anyone&#8212;but trust me, these aren&#8217;t strawman arguments I made up to argue with.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee! (via ko-fi)&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee! (via ko-fi)</span></a></p><p></p><h2>Misconception 1: &#8220;AI search is dangerous because it only gives you what you want&#8221;</h2><p>This argument typically starts with an accurate premise: LLMs like ChatGPT exhibit sycophantic tendencies as a result of techniques like RLHF (Reinforcement Learning from Human Feedback)<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-1" href="#footnote-1" target="_self">1</a>. From there, it often goes off the rails. 
Librarians worry that users will be trapped in filter bubbles, with AI tools reinforcing outlandish beliefs and leading them down conspiracy theory rabbit holes.</p><p>There are real concerns here but one needs to be clear what exactly we should worry about</p><h4>The category error</h4><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!hYhD!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F18037ca5-63b1-4842-8603-791966ef911b_2816x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!hYhD!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F18037ca5-63b1-4842-8603-791966ef911b_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!hYhD!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F18037ca5-63b1-4842-8603-791966ef911b_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!hYhD!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F18037ca5-63b1-4842-8603-791966ef911b_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!hYhD!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F18037ca5-63b1-4842-8603-791966ef911b_2816x1536.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!hYhD!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F18037ca5-63b1-4842-8603-791966ef911b_2816x1536.png" width="1456" height="794" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/18037ca5-63b1-4842-8603-791966ef911b_2816x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:794,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:7716151,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/186338478?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F18037ca5-63b1-4842-8603-791966ef911b_2816x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!hYhD!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F18037ca5-63b1-4842-8603-791966ef911b_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!hYhD!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F18037ca5-63b1-4842-8603-791966ef911b_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!hYhD!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F18037ca5-63b1-4842-8603-791966ef911b_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!hYhD!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F18037ca5-63b1-4842-8603-791966ef911b_2816x1536.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Sycophancy is a conversational behaviour&#8212;agreeing with stated positions, excessive hedging, reluctance to correct the user. It&#8217;s meaningfully different from retrieval bias, which is what would actually affect search systems.</p><blockquote><p>When you search for documents, the retrieval system isn&#8217;t &#8220;agreeing&#8221; with you. It&#8217;s matching your query to content. These are fundamentally different operations. 
More on that later.</p></blockquote><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><h4>The architectural misunderstanding</h4><p>Many also seem not to realise that conventional AI search is typically search plus generation (now commonly known as Retrieval-Augmented Generation), not just an LLM responding from its pretraining. </p><p>When someone uses Consensus or Elicit, they&#8217;re querying a corpus. The LLM layer summarises retrieved documents; it&#8217;s not confabulating from weights. The retrieval step is functionally similar to what a discovery layer does. 
The generation step is closer functionally to what a reference librarian does when synthesising sources for a patron.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!mrx3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!mrx3!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 424w, https://substackcdn.com/image/fetch/$s_!mrx3!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 848w, https://substackcdn.com/image/fetch/$s_!mrx3!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!mrx3!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!mrx3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg" width="1024" height="565" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:565,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!mrx3!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 424w, https://substackcdn.com/image/fetch/$s_!mrx3!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 848w, https://substackcdn.com/image/fetch/$s_!mrx3!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!mrx3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Criticising RAG-based search for &#8220;sycophancy&#8221; is like criticising a systematic review for only including studies that matched the search strategy<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-2" href="#footnote-2" target="_self">2</a>. It&#8217;s a category error.</p><p>I should note this is most clearly true for simpler RAG architectures. Modern agentic search systems increasingly blur the boundary between retrieval and generation. Tools like Consensus and Undermind now use LLMs to reformulate user queries before retrieval&#8212;expanding terms, inferring intent, generating multiple search strategies. Could the LLM interpret your intent sycophantically at this stage (also see the next section)? 
I personally think the risk of this is low, because you are using a specialised tool&#8212;one that is not geared toward &#8220;knowing&#8221; you&#8212;rather than a general LLM like ChatGPT.</p><p>This is not a foregone conclusion and is worth studying. </p><p>It also has a simple solution: transparency about query reformulation, not abandoning AI-assisted search altogether.</p><h4>Even pretraining responses mostly reflect corpus consensus</h4><p>Here&#8217;s what&#8217;s underappreciated: even pure LLM responses (without retrieval) default to corpus consensus. This is often the opposite of telling users what they want to hear.</p><p>Ask a model about vaccines, climate change, or evolution&#8212;you&#8217;ll get the scientific mainstream regardless of your priors. The model tends to stick to what it knows was most prevalent in its training data.</p><p>Sycophancy only kicks in when you state a position and the model defers to it conversationally. That&#8217;s a different failure mode entirely, and not one that typically applies to a search query like &#8220;what does the evidence say about X.&#8221;</p><p>LLMs are better described as consensus machines<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-3" href="#footnote-3" target="_self">3</a>.</p><p>Trained on vast amounts of data, they&#8217;re strongly disposed toward mainstream positions. Far from agreeing with fringe views, they often push back aggressively against claims they &#8220;know&#8221; to be false&#8212;sometimes so rigidly that they&#8217;ll deny breaking news events because such information conflicts with their training data<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-4" href="#footnote-4" target="_self">4</a>.</p><p>This has an underexplored downside. 
If LLMs default to mainstream positions, they may disadvantage emerging research, minority scholarly viewpoints, or fields where &#8220;consensus&#8221; is contested or disciplinarily biased. A system that systematically privileges well-established views could subtly suppress heterodox scholarship&#8212;not through malice, but through training data distributions.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!zLqN!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3391d0c1-39cc-4be6-a7dc-9a7d64cf2017_1024x559.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!zLqN!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3391d0c1-39cc-4be6-a7dc-9a7d64cf2017_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!zLqN!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3391d0c1-39cc-4be6-a7dc-9a7d64cf2017_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!zLqN!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3391d0c1-39cc-4be6-a7dc-9a7d64cf2017_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!zLqN!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3391d0c1-39cc-4be6-a7dc-9a7d64cf2017_1024x559.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!zLqN!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3391d0c1-39cc-4be6-a7dc-9a7d64cf2017_1024x559.jpeg" width="1024" height="559" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/3391d0c1-39cc-4be6-a7dc-9a7d64cf2017_1024x559.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:82239,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/186338478?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3391d0c1-39cc-4be6-a7dc-9a7d64cf2017_1024x559.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!zLqN!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3391d0c1-39cc-4be6-a7dc-9a7d64cf2017_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!zLqN!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3391d0c1-39cc-4be6-a7dc-9a7d64cf2017_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!zLqN!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3391d0c1-39cc-4be6-a7dc-9a7d64cf2017_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!zLqN!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3391d0c1-39cc-4be6-a7dc-9a7d64cf2017_1024x559.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This isn&#8217;t the same as the filter-bubble concern (which imagines AI reinforcing individual user biases), but it&#8217;s a form of bias worth investigating empirically.</p><p>On genuinely contested issues, yes, LLMs may be inclined to agree with the user. 
But this is addressable through better prompts and system design.</p><h4>The irony: traditional search has always &#8220;given people what they want&#8221;</h4><p>The concern about AI search &#8220;giving people what they want&#8221; is particularly ironic given that much of traditional search has done this for decades:</p><ul><li><p>Google&#8217;s personalisation literally optimises for engagement</p></li><li><p>Academic citation-based ranking amplifies already-popular work</p></li><li><p>Users self-select sources confirming their priors through the databases they choose and the keywords they use</p></li></ul><p>None of this is new with AI. If anything, semantic search that surfaces conceptually related but differently-framed work might reduce confirmation bias compared to keyword matching, which only returns documents using your exact terminology.</p><p>That said, semantic search might also surface conceptually related documents that reinforce a user&#8217;s framing rather than challenge it. Whether semantic retrieval increases or decreases exposure to diverse perspectives is an empirical question, not a foregone conclusion in either direction.</p><h4>Where legitimate concerns actually lie</h4><p>This isn&#8217;t to say there are no concerns worth examining. But they&#8217;re empirical questions, not foregone conclusions:</p><ul><li><p>Summarisation layers might flatten nuance or selectively emphasise certain findings</p></li><li><p>Retrieval models trained on user behaviour could preference &#8220;satisfying&#8221; results over comprehensive ones</p></li><li><p>The synthesis step in RAG systems introduces editorial choices</p></li><li><p>Query reformulation by LLMs could introduce subtle biases before retrieval even occurs</p></li><li><p>Cognitive offloading issues</p></li></ul><p>These are testable hypotheses. 
We should be investigating them rigorously&#8212;and some researchers are beginning to&#8212;not assuming the worst based on a misapplied understanding of sycophancy.</p><h2>Misconception 2: "Friction is good for learning, so AI search shouldn't give you what you ask for"</h2><p>I&#8217;ve heard the suggestion that AI search engines are problematic because they give people what they want.</p><p>Think about how strange this sounds. Forget AI&#8212;consider traditional Boolean search. If I search for:</p><blockquote><p>vaccines cause autism</p></blockquote><p>and the search engine returns documents containing those words, it&#8217;s &#8220;giving me what I asked for.&#8221; Is that bad?</p><p>Semantic search is simply this on steroids. If precise retrieval isn&#8217;t problematic for keyword search, why would it be problematic for semantic search?</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!T-gW!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb39c9f57-eec3-4ab4-9109-8acb8e8280a7_1335x729.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!T-gW!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb39c9f57-eec3-4ab4-9109-8acb8e8280a7_1335x729.png 424w, https://substackcdn.com/image/fetch/$s_!T-gW!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb39c9f57-eec3-4ab4-9109-8acb8e8280a7_1335x729.png 848w, https://substackcdn.com/image/fetch/$s_!T-gW!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb39c9f57-eec3-4ab4-9109-8acb8e8280a7_1335x729.png 1272w, 
https://substackcdn.com/image/fetch/$s_!T-gW!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb39c9f57-eec3-4ab4-9109-8acb8e8280a7_1335x729.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!T-gW!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb39c9f57-eec3-4ab4-9109-8acb8e8280a7_1335x729.png" width="1335" height="729" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/b39c9f57-eec3-4ab4-9109-8acb8e8280a7_1335x729.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:729,&quot;width&quot;:1335,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1111035,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/186338478?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb39c9f57-eec3-4ab4-9109-8acb8e8280a7_1335x729.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!T-gW!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb39c9f57-eec3-4ab4-9109-8acb8e8280a7_1335x729.png 424w, https://substackcdn.com/image/fetch/$s_!T-gW!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb39c9f57-eec3-4ab4-9109-8acb8e8280a7_1335x729.png 848w, 
https://substackcdn.com/image/fetch/$s_!T-gW!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb39c9f57-eec3-4ab4-9109-8acb8e8280a7_1335x729.png 1272w, https://substackcdn.com/image/fetch/$s_!T-gW!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb39c9f57-eec3-4ab4-9109-8acb8e8280a7_1335x729.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>I should acknowledge that the analogy between Boolean and semantic search isn&#8217;t perfect. 
Boolean search possesses a kind of <strong>mechanical indifference</strong>: it matches character strings without understanding. Semantic search, by contrast, <em>interprets</em> meaning. It makes invisible judgements about what is &#8220;conceptually related&#8221; to your query<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-5" href="#footnote-5" target="_self">5</a>.</p><p>But bad retrieval is not the solution. Even if semantic search introduces these biases, the underlying claim&#8212;that we should tolerate poor retrieval because cognitive friction has pedagogical value&#8212;is flawed.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!d84T!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91b81bc6-1a5b-491e-b908-d0208d612a4a_1327x719.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!d84T!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91b81bc6-1a5b-491e-b908-d0208d612a4a_1327x719.png 424w, https://substackcdn.com/image/fetch/$s_!d84T!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91b81bc6-1a5b-491e-b908-d0208d612a4a_1327x719.png 848w, https://substackcdn.com/image/fetch/$s_!d84T!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91b81bc6-1a5b-491e-b908-d0208d612a4a_1327x719.png 1272w, https://substackcdn.com/image/fetch/$s_!d84T!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91b81bc6-1a5b-491e-b908-d0208d612a4a_1327x719.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!d84T!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91b81bc6-1a5b-491e-b908-d0208d612a4a_1327x719.png" width="1327" height="719" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/91b81bc6-1a5b-491e-b908-d0208d612a4a_1327x719.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:719,&quot;width&quot;:1327,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1149522,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/186338478?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91b81bc6-1a5b-491e-b908-d0208d612a4a_1327x719.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!d84T!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91b81bc6-1a5b-491e-b908-d0208d612a4a_1327x719.png 424w, https://substackcdn.com/image/fetch/$s_!d84T!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91b81bc6-1a5b-491e-b908-d0208d612a4a_1327x719.png 848w, https://substackcdn.com/image/fetch/$s_!d84T!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91b81bc6-1a5b-491e-b908-d0208d612a4a_1327x719.png 1272w, https://substackcdn.com/image/fetch/$s_!d84T!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F91b81bc6-1a5b-491e-b908-d0208d612a4a_1327x719.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>There is certainly value in some friction: working through keyword translation (arguably), understanding knowledge organisation, and evaluating sources (definitely) are productive challenges. But a relevancy algorithm that returns irrelevant results isn&#8217;t productive friction. It&#8217;s just poor retrieval. </p><p>Should we deliberately worsen our library catalogue rankings to create more friction? Obviously not. 
Not all friction is valuable, and we should be precise about which kinds are.</p><h4>Why you actually need and want good retrieval </h4><p>Consider what good retrieval enables:</p><p>Surfacing multiple perspectives. If a student wants to understand both sides of a debate, they need precise retrieval of the strongest arguments from each position&#8212;not random noise in the relevancy rankings.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!7ifF!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F45c56297-5d2e-4d49-a75d-c461b77ce252_1024x559.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!7ifF!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F45c56297-5d2e-4d49-a75d-c461b77ce252_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!7ifF!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F45c56297-5d2e-4d49-a75d-c461b77ce252_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!7ifF!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F45c56297-5d2e-4d49-a75d-c461b77ce252_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!7ifF!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F45c56297-5d2e-4d49-a75d-c461b77ce252_1024x559.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!7ifF!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F45c56297-5d2e-4d49-a75d-c461b77ce252_1024x559.jpeg" 
width="1024" height="559" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/45c56297-5d2e-4d49-a75d-c461b77ce252_1024x559.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:139737,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/186338478?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F45c56297-5d2e-4d49-a75d-c461b77ce252_1024x559.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!7ifF!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F45c56297-5d2e-4d49-a75d-c461b77ce252_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!7ifF!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F45c56297-5d2e-4d49-a75d-c461b77ce252_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!7ifF!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F45c56297-5d2e-4d49-a75d-c461b77ce252_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!7ifF!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F45c56297-5d2e-4d49-a75d-c461b77ce252_1024x559.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg 
role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Addressing filter bubble concerns properly. If you&#8217;re worried about users asking &#8220;show me papers saying vaccines cause autism,&#8221; the solution is teaching them to ask more open-ended questions and evaluate what they find. Degrading retrieval quality isn&#8217;t the answer. A brief aside: tools that silently redirect user queries to &#8220;safer&#8221; queries aren&#8217;t the solution either. Paternalistic redirection is just filter bubbles with different politics. 
You can&#8217;t coherently worry about tools giving users what they want while praising tools that substitute what the LLM thinks users should see.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!E5g2!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe25c5abd-deaa-4091-8220-cb2b2581a6a0_1001x546.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!E5g2!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe25c5abd-deaa-4091-8220-cb2b2581a6a0_1001x546.png 424w, https://substackcdn.com/image/fetch/$s_!E5g2!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe25c5abd-deaa-4091-8220-cb2b2581a6a0_1001x546.png 848w, https://substackcdn.com/image/fetch/$s_!E5g2!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe25c5abd-deaa-4091-8220-cb2b2581a6a0_1001x546.png 1272w, https://substackcdn.com/image/fetch/$s_!E5g2!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe25c5abd-deaa-4091-8220-cb2b2581a6a0_1001x546.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!E5g2!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe25c5abd-deaa-4091-8220-cb2b2581a6a0_1001x546.png" width="1001" height="546" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/e25c5abd-deaa-4091-8220-cb2b2581a6a0_1001x546.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:546,&quot;width&quot;:1001,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:743950,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/186338478?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe25c5abd-deaa-4091-8220-cb2b2581a6a0_1001x546.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!E5g2!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe25c5abd-deaa-4091-8220-cb2b2581a6a0_1001x546.png 424w, https://substackcdn.com/image/fetch/$s_!E5g2!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe25c5abd-deaa-4091-8220-cb2b2581a6a0_1001x546.png 848w, https://substackcdn.com/image/fetch/$s_!E5g2!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe25c5abd-deaa-4091-8220-cb2b2581a6a0_1001x546.png 1272w, https://substackcdn.com/image/fetch/$s_!E5g2!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe25c5abd-deaa-4091-8220-cb2b2581a6a0_1001x546.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>We&#8217;ve already seen this problem manifest in practice. As I documented in &#8220;<a href="https://aarontay.substack.com/p/the-ai-powered-library-search-that">The AI-Powered Library Search That Refused to Search</a>,&#8221; content-moderation layers in tools like Primo Research Assistant and Summon Research Assistant were blocking searches on topics like &#8220;Tulsa race massacre&#8221; and &#8220;Gaza War&#8221;&#8212;returning zero results or error messages for legitimate scholarly queries. These filters, designed for social media chatbots, have no place in academic discovery systems. A search tool that decides which historical atrocities are too sensitive to research is not protecting users; it&#8217;s censoring scholarship.</p><p>If source quality is the concern, we already know what to do! 
Curate at the corpus level&#8212;don&#8217;t let models second-guess user intent. Or be inclusive with sources and invest in teaching source evaluation and critical thinking.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!LFDN!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab19895e-519a-47ad-b3e8-c1bb07258397_2816x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!LFDN!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab19895e-519a-47ad-b3e8-c1bb07258397_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!LFDN!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab19895e-519a-47ad-b3e8-c1bb07258397_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!LFDN!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab19895e-519a-47ad-b3e8-c1bb07258397_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!LFDN!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab19895e-519a-47ad-b3e8-c1bb07258397_2816x1536.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!LFDN!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab19895e-519a-47ad-b3e8-c1bb07258397_2816x1536.png" width="1456" height="794" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ab19895e-519a-47ad-b3e8-c1bb07258397_2816x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:794,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:8331908,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/186338478?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab19895e-519a-47ad-b3e8-c1bb07258397_2816x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!LFDN!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab19895e-519a-47ad-b3e8-c1bb07258397_2816x1536.png 424w, https://substackcdn.com/image/fetch/$s_!LFDN!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab19895e-519a-47ad-b3e8-c1bb07258397_2816x1536.png 848w, https://substackcdn.com/image/fetch/$s_!LFDN!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab19895e-519a-47ad-b3e8-c1bb07258397_2816x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!LFDN!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab19895e-519a-47ad-b3e8-c1bb07258397_2816x1536.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><h3>The bottom line</h3><p>&#8220;AI search&#8221; is still search. These are RAG systems with retrieval and generation components. The retrieval component should optimise for precision and recall. Generation concerns&#8212;hallucination, over-summarisation&#8212;are separate issues that don&#8217;t excuse poor retrieval.</p><p>But I want to be careful not to be too tidy here. 
The concerns librarians raise, though often imprecisely articulated, sometimes point toward real issues of bias:</p><ul><li><p>The retrieval/generation boundary is messier in agentic systems than in simple RAG</p></li><li><p>Semantic interpretation introduces judgements and possible bias that keyword matching doesn&#8217;t</p></li><li><p>&#8220;Consensus machine&#8221; behaviour could systematically disadvantage certain scholarship</p></li><li><p>We lack rigorous empirical studies on many of these questions</p></li></ul><p>The appropriate response isn&#8217;t to dismiss AI search based on vague misunderstandings. It&#8217;s to get precise about what the actual failure modes are, and to investigate them empirically.</p><p>We can value deliberate friction (slowing users down, prompting reflection, not auto-generating full papers) while still demanding that search actually works. We can acknowledge genuine concerns about agentic query reformulation while rejecting the conflation of sycophancy with retrieval.</p><p>The library world has traditionally been far too forgiving of poor search rankings and user interfaces; we certainly don&#8217;t want fuzzy thinking about search to give vendors an opportunity to excuse poor products!</p><p></p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee! (via ko-fi)&quot;,&quot;action&quot;:null,&quot;class&quot;:&quot;button-wrapper&quot;}" data-component-name="ButtonCreateButton"><a class="button primary button-wrapper" href="https://ko-fi.com/aarontay"><span>Buy me coffee! 
(via ko-fi)</span></a></p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"></p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p>I found after publishing this that Mike Caulfield, of SIFT fame, also wrote about roughly the same issue from a different angle; you can read his post: <a href="https://mikecaulfield.substack.com/p/ai-sycophancy-is-not-always-harmful">&#8220;AI sycophancy&#8221; is not always harmful</a>.</p><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-1" href="#footnote-anchor-1" class="footnote-number" contenteditable="false" target="_self">1</a><div class="footnote-content"><p>Sycophancy is not a bug in the code; it is a feature of the training. Techniques like Reinforcement Learning from Human Feedback (RLHF) specifically optimize models to be helpful and harmless, which the model often interprets as 'never disagree with the user.' A search index, by contrast, has no social anxiety. It doesn't care if the results offend your false premise.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-2" href="#footnote-anchor-2" class="footnote-number" contenteditable="false" target="_self">2</a><div class="footnote-content"><p>To be fair, when RAG systems fail to retrieve relevant results, the LLM may still be predisposed to attempt an answer rather than saying &#8220;I don&#8217;t know.&#8221; 
This is a genuine concern&#8212;but arguably a different issue from sycophancy.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-3" href="#footnote-anchor-3" class="footnote-number" contenteditable="false" target="_self">3</a><div class="footnote-content"><p>This is of course a huge simplification. LLMs approximate the conditional distribution of the corpus of text they are trained on. If your prompt is underspecified, the distribution&#8217;s peak often corresponds to &#8220;what most people would say.&#8221; That looks like consensus.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-4" href="#footnote-anchor-4" class="footnote-number" contenteditable="false" target="_self">4</a><div class="footnote-content"><p>See, for example, <a href="https://www.linkedin.com/feed/update/urn:li:activity:7424308620089200641/?commentUrn=urn%3Ali%3Acomment%3A(activity%3A7424308620089200641%2C7424690490609913857)&amp;dashCommentUrn=urn%3Ali%3Afsd_comment%3A(7424690490609913857%2Curn%3Ali%3Aactivity%3A7424308620089200641)">this series of comments</a>.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-5" href="#footnote-anchor-5" class="footnote-number" contenteditable="false" target="_self">5</a><div class="footnote-content"><p>But again this isn&#8217;t being sycophantic. 
</p></div></div>]]></content:encoded></item><item><title><![CDATA[Classifying the Ways LLMs Summarise in Academic Search ]]></title><description><![CDATA[Understanding AI Summaries in EBSCO, ProQuest, and More]]></description><link>https://aarontay.substack.com/p/classifying-the-ways-llms-summarise</link><guid isPermaLink="false">https://aarontay.substack.com/p/classifying-the-ways-llms-summarise</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Sat, 24 Jan 2026 15:26:55 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!RLPP!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb27ab4dc-e6a5-44df-a189-b033174d58c9_2752x1536.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!RLPP!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb27ab4dc-e6a5-44df-a189-b033174d58c9_2752x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!RLPP!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb27ab4dc-e6a5-44df-a189-b033174d58c9_2752x1536.png 424w, https://substackcdn.com/image/fetch/$s_!RLPP!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb27ab4dc-e6a5-44df-a189-b033174d58c9_2752x1536.png 848w, https://substackcdn.com/image/fetch/$s_!RLPP!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb27ab4dc-e6a5-44df-a189-b033174d58c9_2752x1536.png 1272w, 
https://substackcdn.com/image/fetch/$s_!RLPP!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb27ab4dc-e6a5-44df-a189-b033174d58c9_2752x1536.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!RLPP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb27ab4dc-e6a5-44df-a189-b033174d58c9_2752x1536.png" width="1456" height="813" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/b27ab4dc-e6a5-44df-a189-b033174d58c9_2752x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:813,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:6013883,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/185621087?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb27ab4dc-e6a5-44df-a189-b033174d58c9_2752x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!RLPP!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb27ab4dc-e6a5-44df-a189-b033174d58c9_2752x1536.png 424w, https://substackcdn.com/image/fetch/$s_!RLPP!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb27ab4dc-e6a5-44df-a189-b033174d58c9_2752x1536.png 848w, 
https://substackcdn.com/image/fetch/$s_!RLPP!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb27ab4dc-e6a5-44df-a189-b033174d58c9_2752x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!RLPP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb27ab4dc-e6a5-44df-a189-b033174d58c9_2752x1536.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>I&#8217;ve focused mainly on understanding retrieval for the past few months, e.g., classifying <a 
href="https://aarontay.substack.com/p/how-agentic-are-academic-deep-research">Academic search into the &#8220;4 Quadrants of Search&#8221;</a> and <a href="https://aarontay.substack.com/p/how-agentic-are-academic-deep-research">distinguishing between truly &#8220;agentic&#8221; systems and more predefined workflows</a>.</p><p>But retrieval is just one part of the equation. LLMs and GenAI are also impacting search through their ability to extract and summarise text<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-1" href="#footnote-1" target="_self">1</a>.</p><p>Regular readers are familiar with how &#8220;naive&#8221; Retrieval Augmented Generation (RAG) works: it uses retrieval to find relevant content and then uses the generative capabilities of LLMs to summarise it<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-2" href="#footnote-2" target="_self">2</a>. But there&#8217;s considerably more nuance to how summarisation is deployed across academic search products.</p><p>In this post, I&#8217;ll distinguish between the different ways LLMs summarise in academic search and what the implications are for evaluation and trust.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee!&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee!</span></a></p><p></p><h2>A Taxonomy of LLM Summarisation in Academic Search</h2><p>After examining various academic search products, here is how I categorise them<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-3" href="#footnote-3" target="_self">3</a>:</p><ol><li><p><strong>Single Document Summarisation </strong>&#8212; LLM summarises one document at a time</p></li><li><p><strong>Sequential Single Document 
Summarisation</strong> &#8212; LLM summarises multiple documents individually (e.g., synthesis tables)</p></li><li><p><strong>Query-based Multi-Document Summarisation</strong> &#8212; LLM synthesises across multiple documents to answer a query (e.g., RAG)</p></li></ol><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!6MqK!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63d0d1a6-cd2c-4908-8524-ceaa315f4353_1024x559.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!6MqK!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63d0d1a6-cd2c-4908-8524-ceaa315f4353_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!6MqK!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63d0d1a6-cd2c-4908-8524-ceaa315f4353_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!6MqK!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63d0d1a6-cd2c-4908-8524-ceaa315f4353_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!6MqK!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63d0d1a6-cd2c-4908-8524-ceaa315f4353_1024x559.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!6MqK!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63d0d1a6-cd2c-4908-8524-ceaa315f4353_1024x559.jpeg" width="1024" height="559" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/63d0d1a6-cd2c-4908-8524-ceaa315f4353_1024x559.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:158697,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/185621087?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63d0d1a6-cd2c-4908-8524-ceaa315f4353_1024x559.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!6MqK!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63d0d1a6-cd2c-4908-8524-ceaa315f4353_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!6MqK!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63d0d1a6-cd2c-4908-8524-ceaa315f4353_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!6MqK!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63d0d1a6-cd2c-4908-8524-ceaa315f4353_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!6MqK!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63d0d1a6-cd2c-4908-8524-ceaa315f4353_1024x559.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg 
role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>I&#8217;m classifying by (1) how many documents the model is allowed to use at once, and (2) how much the user/query can change the prompt. Those two knobs largely determine utility, risk, and how testable the feature is.</p><p>Utility tends to increase as the model is allowed to use more documents and answer more specific questions. 
Risk increases when you combine broader scope with more prompt freedom and harder reasoning (especially evidence weighting and contradiction handling).</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe now&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://aarontay.substack.com/subscribe?"><span>Subscribe now</span></a></p><p></p><h2>1. Single document generation (fixed &#8594; query-conditioned &#8594; free-form)</h2><p>Single Document Summarisation is straightforward: you use an LLM to summarise an individual document. However, there are three distinct variants worth distinguishing:</p><p>1a. <strong>Fixed Button Summarisation</strong> &#8212; A preset prompt summarises the document</p><p>1b. <strong>Fixed Query-Dependent Answer</strong><a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-4" href="#footnote-4" target="_self">4</a> &#8212; A preset prompt that incorporates your search query is applied to the document</p><p>1c. <strong>Dynamic Q&amp;A / Chat with PDF</strong> &#8212; You provide arbitrary prompts over the individual document</p><p>While you might expect these systems to feed entire documents to an LLM, most academic implementations&#8212;including EBSCO AI Insights and ProQuest Research Assistant&#8212;use RAG internally.  
</p><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!zWC3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F313a9a82-3757-43e4-9283-53d4016005d1_871x228.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!zWC3!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F313a9a82-3757-43e4-9283-53d4016005d1_871x228.png 424w, https://substackcdn.com/image/fetch/$s_!zWC3!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F313a9a82-3757-43e4-9283-53d4016005d1_871x228.png 848w, https://substackcdn.com/image/fetch/$s_!zWC3!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F313a9a82-3757-43e4-9283-53d4016005d1_871x228.png 1272w, https://substackcdn.com/image/fetch/$s_!zWC3!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F313a9a82-3757-43e4-9283-53d4016005d1_871x228.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!zWC3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F313a9a82-3757-43e4-9283-53d4016005d1_871x228.png" width="871" height="228" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/313a9a82-3757-43e4-9283-53d4016005d1_871x228.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:228,&quot;width&quot;:871,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:238558,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/185621087?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F313a9a82-3757-43e4-9283-53d4016005d1_871x228.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!zWC3!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F313a9a82-3757-43e4-9283-53d4016005d1_871x228.png 424w, https://substackcdn.com/image/fetch/$s_!zWC3!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F313a9a82-3757-43e4-9283-53d4016005d1_871x228.png 848w, https://substackcdn.com/image/fetch/$s_!zWC3!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F313a9a82-3757-43e4-9283-53d4016005d1_871x228.png 1272w, https://substackcdn.com/image/fetch/$s_!zWC3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F313a9a82-3757-43e4-9283-53d4016005d1_871x228.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p><a 
href="https://connect.ebsco.com/s/article/Generative-AI-Insights-Beta-Summaries?language=en_US#:~:text=AI%20Insights%20summaries%20are%20generated%20by%20prompting%20a%20Large%20Language%20Model%20to%20summarize%20insights%20from%20the%20specific%20article%20the%20user%20selected%C2%A0AI%20Insights%20for.%20The%20AI%20Insight%20prompt%20uses%20a%20method%20called%20Retrieval%20Augmented%20Generation%20(RAG)%20to%20reduce%20hallucinations">How AI Insights are generated</a></p><p> </p><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!E3oD!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F201c2e7c-c2e9-47e0-99b6-94c2f66531e2_861x107.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!E3oD!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F201c2e7c-c2e9-47e0-99b6-94c2f66531e2_861x107.png 424w, https://substackcdn.com/image/fetch/$s_!E3oD!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F201c2e7c-c2e9-47e0-99b6-94c2f66531e2_861x107.png 848w, https://substackcdn.com/image/fetch/$s_!E3oD!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F201c2e7c-c2e9-47e0-99b6-94c2f66531e2_861x107.png 1272w, https://substackcdn.com/image/fetch/$s_!E3oD!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F201c2e7c-c2e9-47e0-99b6-94c2f66531e2_861x107.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!E3oD!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F201c2e7c-c2e9-47e0-99b6-94c2f66531e2_861x107.png" width="861" height="107" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/201c2e7c-c2e9-47e0-99b6-94c2f66531e2_861x107.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:107,&quot;width&quot;:861,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:144374,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/185621087?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F201c2e7c-c2e9-47e0-99b6-94c2f66531e2_861x107.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!E3oD!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F201c2e7c-c2e9-47e0-99b6-94c2f66531e2_861x107.png 424w, https://substackcdn.com/image/fetch/$s_!E3oD!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F201c2e7c-c2e9-47e0-99b6-94c2f66531e2_861x107.png 848w, https://substackcdn.com/image/fetch/$s_!E3oD!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F201c2e7c-c2e9-47e0-99b6-94c2f66531e2_861x107.png 1272w, https://substackcdn.com/image/fetch/$s_!E3oD!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F201c2e7c-c2e9-47e0-99b6-94c2f66531e2_861x107.png 1456w" sizes="100vw" 
loading="lazy"></picture><div></div></div></a></figure></div><p><a href="https://support.proquest.com/s/article/Ebook-Central-Research-Assistant-FAQ?language=en_US#:~:text=No%2C%20the%20Research%20Assistant%20uses%20a%20Retrieval%2DAugmented%20Generation%20(RAG)%20model%20and%20generates%20responses%20based%20only%20on%20the%20chapter%20level%2C%20not%20the%20entire%20book.">How ProQuest Research Assistant generates key takeaways and concepts</a></p><p>If you see supporting snippets shown alongside generated statements, that is a signal the system is using RAG rather than processing the full document directly.</p><h3>1a. Fixed Button Summarisation</h3><p>The simplest form: you click a button, a fixed prompt is sent, and a summary appears. EBSCO&#8217;s AI Insights exemplifies this approach.  </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!FlG2!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8d31d96-a306-48aa-84b2-4ae93e8aa83b_719x624.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!FlG2!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8d31d96-a306-48aa-84b2-4ae93e8aa83b_719x624.png 424w, https://substackcdn.com/image/fetch/$s_!FlG2!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8d31d96-a306-48aa-84b2-4ae93e8aa83b_719x624.png 848w, https://substackcdn.com/image/fetch/$s_!FlG2!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8d31d96-a306-48aa-84b2-4ae93e8aa83b_719x624.png 1272w, 
https://substackcdn.com/image/fetch/$s_!FlG2!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8d31d96-a306-48aa-84b2-4ae93e8aa83b_719x624.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!FlG2!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8d31d96-a306-48aa-84b2-4ae93e8aa83b_719x624.png" width="719" height="624" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/e8d31d96-a306-48aa-84b2-4ae93e8aa83b_719x624.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:624,&quot;width&quot;:719,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:118654,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/185621087?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8d31d96-a306-48aa-84b2-4ae93e8aa83b_719x624.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!FlG2!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8d31d96-a306-48aa-84b2-4ae93e8aa83b_719x624.png 424w, https://substackcdn.com/image/fetch/$s_!FlG2!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8d31d96-a306-48aa-84b2-4ae93e8aa83b_719x624.png 848w, https://substackcdn.com/image/fetch/$s_!FlG2!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8d31d96-a306-48aa-84b2-4ae93e8aa83b_719x624.png 
1272w, https://substackcdn.com/image/fetch/$s_!FlG2!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8d31d96-a306-48aa-84b2-4ae93e8aa83b_719x624.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p> </p><p><a href="https://connect.ebsco.com/s/article/Artificial-Intelligence-AI-Transparency-Fact-Sheet-Generative-AI-Insights?language=en_US">EBSCO AI Insights </a>explains it this way:</p><blockquote><p>When the AI Insight button is clicked, a prompt is sent to a Large Language Model (LLM) prompting the AI to summarize the full text article into 2-5 
relevant insights into the article. We ground the AI response on the full text (with publisher permission) to reduce hallucinations. No AI training is done on the full text article. The user query is not used in AI Insights.</p></blockquote><p>This is probably the lowest-risk summarisation feature because everything is predictable, with the fewest variables: the prompt is fixed, the document is known, and the vendor can test quality systematically before deployment. <a href="https://knowledge.exlibrisgroup.com/Primo/Product_Documentation/020Primo_VE/Primo_VE_(English)/030Primo_VE_User_Interface/Links_to_Document_Insights_in_Primo_VE">Ex Libris&#8217;s Document Insights in Primo </a>uses a similar approach.</p><p> </p><p>Questions to ask vendors:</p><ul><li><p>Is full text used, or just the abstract? For ebooks, is it summarising a chapter or the entire book?</p></li><li><p>Is the system text-only, or can it process images and figures?</p></li><li><p>How do you test the accuracy of these summarisations and do you have benchmarks publicly available?</p></li><li><p>How deterministic is the output? Given a fixed prompt over a fixed document, why not pre-generate and cache summaries?</p><p></p></li></ul><p>On that last point: pre-generation would save compute and ensure consistency, but I suspect most vendors avoid this for IP reasons. That said, <a href="https://support.proquest.com/s/article/Ebook-Central-Research-Assistant-FAQ?language=en_US#:~:text=Will%20every%20patron,behavior%20may%20change.">the FAQ for Ebook Central Research Assistant notes it will &#8220;generate the same response for each chapter, regardless of who the user is or when they submit the prompt.&#8221;</a></p><p> </p><h3><strong>1b. 
Fixed Query-Dependent Answer</strong></h3><p>This variant is also &#8220;fixed&#8221; in that you cannot type arbitrary input&#8212;but the preset prompt incorporates your search query.</p><p><a href="https://support.proquest.com/s/article/ProQuest-Research-Assistant-FAQs?language=en_US">ProQuest Research Assistant</a> demonstrates this well. When you click on an article, a sidebar automatically generates &#8220;Key Takeaways&#8221; along with options for Essential Details, Findings or Conclusions, Important Concepts, and more. </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!BAXz!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbda10636-b5bb-4250-adae-a91dd9d575f4_1871x482.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!BAXz!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbda10636-b5bb-4250-adae-a91dd9d575f4_1871x482.png 424w, https://substackcdn.com/image/fetch/$s_!BAXz!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbda10636-b5bb-4250-adae-a91dd9d575f4_1871x482.png 848w, https://substackcdn.com/image/fetch/$s_!BAXz!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbda10636-b5bb-4250-adae-a91dd9d575f4_1871x482.png 1272w, https://substackcdn.com/image/fetch/$s_!BAXz!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbda10636-b5bb-4250-adae-a91dd9d575f4_1871x482.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!BAXz!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbda10636-b5bb-4250-adae-a91dd9d575f4_1871x482.png" width="1456" height="375" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/bda10636-b5bb-4250-adae-a91dd9d575f4_1871x482.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:375,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:83634,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/185621087?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbda10636-b5bb-4250-adae-a91dd9d575f4_1871x482.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!BAXz!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbda10636-b5bb-4250-adae-a91dd9d575f4_1871x482.png 424w, https://substackcdn.com/image/fetch/$s_!BAXz!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbda10636-b5bb-4250-adae-a91dd9d575f4_1871x482.png 848w, https://substackcdn.com/image/fetch/$s_!BAXz!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbda10636-b5bb-4250-adae-a91dd9d575f4_1871x482.png 1272w, https://substackcdn.com/image/fetch/$s_!BAXz!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbda10636-b5bb-4250-adae-a91dd9d575f4_1871x482.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p> </p><p>Most of these features match 1a, except for one crucial difference: the &#8220;Relationship to your search terms&#8221; section in the auto-generated &#8220;Key Takeaways&#8221;. This means even with deterministic generation, results vary depending on the query used to find the paper. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!fCeO!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F34d06cae-c9af-4e5d-806f-1b082e35c677_594x406.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!fCeO!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F34d06cae-c9af-4e5d-806f-1b082e35c677_594x406.png 424w, https://substackcdn.com/image/fetch/$s_!fCeO!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F34d06cae-c9af-4e5d-806f-1b082e35c677_594x406.png 848w, https://substackcdn.com/image/fetch/$s_!fCeO!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F34d06cae-c9af-4e5d-806f-1b082e35c677_594x406.png 1272w, https://substackcdn.com/image/fetch/$s_!fCeO!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F34d06cae-c9af-4e5d-806f-1b082e35c677_594x406.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!fCeO!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F34d06cae-c9af-4e5d-806f-1b082e35c677_594x406.png" width="594" height="406" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/34d06cae-c9af-4e5d-806f-1b082e35c677_594x406.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:406,&quot;width&quot;:594,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:48003,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/185621087?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F34d06cae-c9af-4e5d-806f-1b082e35c677_594x406.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!fCeO!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F34d06cae-c9af-4e5d-806f-1b082e35c677_594x406.png 424w, https://substackcdn.com/image/fetch/$s_!fCeO!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F34d06cae-c9af-4e5d-806f-1b082e35c677_594x406.png 848w, https://substackcdn.com/image/fetch/$s_!fCeO!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F34d06cae-c9af-4e5d-806f-1b082e35c677_594x406.png 1272w, https://substackcdn.com/image/fetch/$s_!fCeO!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F34d06cae-c9af-4e5d-806f-1b082e35c677_594x406.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p> </p><p> I first encountered query-dependent answers in an older beta of JSTOR&#8217;s Research Tool, which automatically generated text explaining  </p><p><code>How is &lt;query&gt; related to this text</code></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!QemY!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb29459b9-64bb-469b-b733-dde528cb1153_1312x602" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!QemY!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb29459b9-64bb-469b-b733-dde528cb1153_1312x602 
424w, https://substackcdn.com/image/fetch/$s_!QemY!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb29459b9-64bb-469b-b733-dde528cb1153_1312x602 848w, https://substackcdn.com/image/fetch/$s_!QemY!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb29459b9-64bb-469b-b733-dde528cb1153_1312x602 1272w, https://substackcdn.com/image/fetch/$s_!QemY!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb29459b9-64bb-469b-b733-dde528cb1153_1312x602 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!QemY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb29459b9-64bb-469b-b733-dde528cb1153_1312x602" width="1312" height="602" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/b29459b9-64bb-469b-b733-dde528cb1153_1312x602&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:602,&quot;width&quot;:1312,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;A screenshot of a computer\n\nAI-generated content may be incorrect.&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="A screenshot of a computer

AI-generated content may be incorrect." title="A screenshot of a computer

AI-generated content may be incorrect." srcset="https://substackcdn.com/image/fetch/$s_!QemY!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb29459b9-64bb-469b-b733-dde528cb1153_1312x602 424w, https://substackcdn.com/image/fetch/$s_!QemY!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb29459b9-64bb-469b-b733-dde528cb1153_1312x602 848w, https://substackcdn.com/image/fetch/$s_!QemY!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb29459b9-64bb-469b-b733-dde528cb1153_1312x602 1272w, https://substackcdn.com/image/fetch/$s_!QemY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb29459b9-64bb-469b-b733-dde528cb1153_1312x602 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" 
stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>In my view, this feature deserves wider adoption, particularly when paired with &#8220;Semantic/<a href="https://aarontay.substack.com/p/why-embedding-vector-search-is-probably">Embedding Search</a>&#8221;. It directly addresses the <a href="https://aarontay.substack.com/p/the-case-of-the-vanishing-hit-count">&#8220;semantic search always gives you something&#8221; problem&#8212;warning users that even if the system retrieved top-K documents, they might not actually be relevant to the specific question</a>.  </p><p>Compared to fixed single document summarisation, being query dependent makes the result a bit more unpredictable, but it is likely still much easier to test and tune than the next method.</p><p>Questions to ask vendors:</p><ul><li><p>Same questions as in 1a</p></li><li><p>How is the query incorporated? What prompts are used?</p></li></ul><h3><strong>1c. Dynamic Q&amp;A / Chat with PDF</strong></h3><p>Unlike the fixed button-based approaches, here users type arbitrary queries into a chatbot-style interface. This &#8220;Chat with PDF&#8221; pattern has spawned numerous startups, though the value proposition as a standalone product remains unclear given that major platforms are integrating similar functionality directly.</p><p>In academic search, this feature appears in most AI-powered systems, particularly those from startups. 
JSTOR Research Tool (beta) includes this capability.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!oTnL!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe4814423-bb6a-4fe5-a6d3-d67dc5f78bb9_752x597" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!oTnL!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe4814423-bb6a-4fe5-a6d3-d67dc5f78bb9_752x597 424w, https://substackcdn.com/image/fetch/$s_!oTnL!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe4814423-bb6a-4fe5-a6d3-d67dc5f78bb9_752x597 848w, https://substackcdn.com/image/fetch/$s_!oTnL!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe4814423-bb6a-4fe5-a6d3-d67dc5f78bb9_752x597 1272w, https://substackcdn.com/image/fetch/$s_!oTnL!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe4814423-bb6a-4fe5-a6d3-d67dc5f78bb9_752x597 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!oTnL!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe4814423-bb6a-4fe5-a6d3-d67dc5f78bb9_752x597" width="752" height="597" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/e4814423-bb6a-4fe5-a6d3-d67dc5f78bb9_752x597&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:597,&quot;width&quot;:752,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;A screenshot 
of a computer screen\n\nAI-generated content may be incorrect.&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="A screenshot of a computer screen

AI-generated content may be incorrect." title="A screenshot of a computer screen

AI-generated content may be incorrect." srcset="https://substackcdn.com/image/fetch/$s_!oTnL!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe4814423-bb6a-4fe5-a6d3-d67dc5f78bb9_752x597 424w, https://substackcdn.com/image/fetch/$s_!oTnL!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe4814423-bb6a-4fe5-a6d3-d67dc5f78bb9_752x597 848w, https://substackcdn.com/image/fetch/$s_!oTnL!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe4814423-bb6a-4fe5-a6d3-d67dc5f78bb9_752x597 1272w, https://substackcdn.com/image/fetch/$s_!oTnL!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe4814423-bb6a-4fe5-a6d3-d67dc5f78bb9_752x597 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" 
stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The risk profile is notably higher than fixed approaches: vendors cannot predict user input, making output quality inherently less predictable and harder to test comprehensively.</p><p>Questions to ask vendors:</p><ul><li><p>Same questions as in 1a</p></li><li><p>What types of prompts/queries are expected to work and NOT work?</p></li></ul><h2>2. Sequential Single Document Summarisation</h2><p>This method still summarises document-by-document but processes multiple documents in sequence or batch. Elicit.com pioneered this approach in commercial academic search.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!2_xi!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbef101cb-cc48-4cf0-850b-5e16d251eca4_1884x916.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!2_xi!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbef101cb-cc48-4cf0-850b-5e16d251eca4_1884x916.png 424w, https://substackcdn.com/image/fetch/$s_!2_xi!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbef101cb-cc48-4cf0-850b-5e16d251eca4_1884x916.png 848w, 
https://substackcdn.com/image/fetch/$s_!2_xi!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbef101cb-cc48-4cf0-850b-5e16d251eca4_1884x916.png 1272w, https://substackcdn.com/image/fetch/$s_!2_xi!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbef101cb-cc48-4cf0-850b-5e16d251eca4_1884x916.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!2_xi!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbef101cb-cc48-4cf0-850b-5e16d251eca4_1884x916.png" width="1456" height="708" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/bef101cb-cc48-4cf0-850b-5e16d251eca4_1884x916.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:708,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:148045,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/185621087?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbef101cb-cc48-4cf0-850b-5e16d251eca4_1884x916.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!2_xi!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbef101cb-cc48-4cf0-850b-5e16d251eca4_1884x916.png 424w, 
https://substackcdn.com/image/fetch/$s_!2_xi!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbef101cb-cc48-4cf0-850b-5e16d251eca4_1884x916.png 848w, https://substackcdn.com/image/fetch/$s_!2_xi!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbef101cb-cc48-4cf0-850b-5e16d251eca4_1884x916.png 1272w, https://substackcdn.com/image/fetch/$s_!2_xi!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbef101cb-cc48-4cf0-850b-5e16d251eca4_1884x916.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The workflow: Elicit finds relevant papers and auto-generates a &#8220;summary&#8221; column for each. Users can add custom columns, and the LLM extracts or summarises from each paper individually to populate them.</p><p>The auto-generated summary column serves a useful secondary purpose&#8212;it acts as a relevance indicator. Because the summary instruction is query-dependent (e.g., &#8220;In one line, provide a summary of the source in relation to the research question: is there an open access citation advantage&#8221;), irrelevant retrievals become obvious when the summary cannot address the query.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!BeEp!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff69074f9-417d-48b2-8791-8e14a0b9773e_491x621.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!BeEp!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff69074f9-417d-48b2-8791-8e14a0b9773e_491x621.png 424w, https://substackcdn.com/image/fetch/$s_!BeEp!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff69074f9-417d-48b2-8791-8e14a0b9773e_491x621.png 848w, https://substackcdn.com/image/fetch/$s_!BeEp!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff69074f9-417d-48b2-8791-8e14a0b9773e_491x621.png 1272w, 
https://substackcdn.com/image/fetch/$s_!BeEp!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff69074f9-417d-48b2-8791-8e14a0b9773e_491x621.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!BeEp!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff69074f9-417d-48b2-8791-8e14a0b9773e_491x621.png" width="491" height="621" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f69074f9-417d-48b2-8791-8e14a0b9773e_491x621.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:621,&quot;width&quot;:491,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:27218,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/185621087?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff69074f9-417d-48b2-8791-8e14a0b9773e_491x621.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!BeEp!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff69074f9-417d-48b2-8791-8e14a0b9773e_491x621.png 424w, https://substackcdn.com/image/fetch/$s_!BeEp!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff69074f9-417d-48b2-8791-8e14a0b9773e_491x621.png 848w, https://substackcdn.com/image/fetch/$s_!BeEp!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff69074f9-417d-48b2-8791-8e14a0b9773e_491x621.png 1272w, 
https://substackcdn.com/image/fetch/$s_!BeEp!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff69074f9-417d-48b2-8791-8e14a0b9773e_491x621.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p> </p><p>This is essentially ProQuest Research Assistant&#8217;s &#8220;Relationship to your search terms&#8221; applied systematically across all retrieved results.</p><h3>Variants Within This Category</h3><p>Sequential summarisation has its own meaningful distinctions:</p><ul><li><p><strong>Parallel vs. 
sequential processing</strong> &#8212; Are documents processed simultaneously or one after another? This affects both speed and potential for cross-contamination of context.</p></li><li><p><strong>Batch size considerations</strong> &#8212; How many documents can be processed together? Elicit and similar tools typically work with the top-K retrieved results.</p></li><li><p><strong>Extraction vs. summarisation</strong> &#8212; Some columns extract specific data points (study design, sample size) while others summarise. Extraction is generally more reliable.</p></li></ul><p>This category holds particular promise for evidence synthesis workflows. For extracting well-defined variables from structured research papers, LLM-assisted extraction can significantly accelerate systematic reviews&#8212;though human verification remains essential for anything beyond preliminary screening.</p><h2><strong>3. Query-based Multi-Document Summarisation</strong></h2><p>This is the most ambitious and most error-prone category: the LLM takes multiple documents and synthesises them to answer a single query. 
This is technically known as <em>Query-based Multi-Document Summarisation</em>, with RAG being the most common implementation.</p><p>Ex Libris&#8217;s Primo Research Assistant exemplifies this approach, as do many other current products.</p><p> </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!gSHC!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23aa3053-6b02-46e6-afa9-acb27f511965_1351x729.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!gSHC!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23aa3053-6b02-46e6-afa9-acb27f511965_1351x729.png 424w, https://substackcdn.com/image/fetch/$s_!gSHC!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23aa3053-6b02-46e6-afa9-acb27f511965_1351x729.png 848w, https://substackcdn.com/image/fetch/$s_!gSHC!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23aa3053-6b02-46e6-afa9-acb27f511965_1351x729.png 1272w, https://substackcdn.com/image/fetch/$s_!gSHC!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23aa3053-6b02-46e6-afa9-acb27f511965_1351x729.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!gSHC!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23aa3053-6b02-46e6-afa9-acb27f511965_1351x729.png" width="1351" height="729" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/23aa3053-6b02-46e6-afa9-acb27f511965_1351x729.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:729,&quot;width&quot;:1351,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:146274,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/185621087?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23aa3053-6b02-46e6-afa9-acb27f511965_1351x729.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!gSHC!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23aa3053-6b02-46e6-afa9-acb27f511965_1351x729.png 424w, https://substackcdn.com/image/fetch/$s_!gSHC!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23aa3053-6b02-46e6-afa9-acb27f511965_1351x729.png 848w, https://substackcdn.com/image/fetch/$s_!gSHC!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23aa3053-6b02-46e6-afa9-acb27f511965_1351x729.png 1272w, https://substackcdn.com/image/fetch/$s_!gSHC!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F23aa3053-6b02-46e6-afa9-acb27f511965_1351x729.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h3>Variants and Hybrid Approaches</h3><p>You&#8217;re not limited to documents from search results. Query-based multi-document summarisation can operate over:</p><ul><li><p>Search results only &#8212; The standard RAG pattern</p></li><li><p>User-provided documents only &#8212; e.g., Google NotebookLM</p></li><li><p>Hybrid: search results plus uploads &#8212; e.g., Elicit Systematic Review, NotebookLM with search enabled</p></li></ul><p>Another variant involves using your initial query to retrieve a fixed set of results, then allowing follow-up questions over that same corpus. </p><p>JSTOR Research Tool (beta) retrieves the top 25 results for your query, which then serve as the knowledge base for subsequent questions. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!-UB5!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe48af08-7cc3-42d5-9e02-868e1636b8d2_1396x668" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!-UB5!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe48af08-7cc3-42d5-9e02-868e1636b8d2_1396x668 424w, https://substackcdn.com/image/fetch/$s_!-UB5!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe48af08-7cc3-42d5-9e02-868e1636b8d2_1396x668 848w, https://substackcdn.com/image/fetch/$s_!-UB5!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe48af08-7cc3-42d5-9e02-868e1636b8d2_1396x668 1272w, https://substackcdn.com/image/fetch/$s_!-UB5!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe48af08-7cc3-42d5-9e02-868e1636b8d2_1396x668 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!-UB5!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe48af08-7cc3-42d5-9e02-868e1636b8d2_1396x668" width="1396" height="668" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/fe48af08-7cc3-42d5-9e02-868e1636b8d2_1396x668&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:668,&quot;width&quot;:1396,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;A screenshot of a computer\n\nAI-generated content may 
be incorrect.&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="A screenshot of a computer

AI-generated content may be incorrect." title="A screenshot of a computer

AI-generated content may be incorrect." srcset="https://substackcdn.com/image/fetch/$s_!-UB5!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe48af08-7cc3-42d5-9e02-868e1636b8d2_1396x668 424w, https://substackcdn.com/image/fetch/$s_!-UB5!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe48af08-7cc3-42d5-9e02-868e1636b8d2_1396x668 848w, https://substackcdn.com/image/fetch/$s_!-UB5!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe48af08-7cc3-42d5-9e02-868e1636b8d2_1396x668 1272w, https://substackcdn.com/image/fetch/$s_!-UB5!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe48af08-7cc3-42d5-9e02-868e1636b8d2_1396x668 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" 
stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>Undermind.ai&#8217;s &#8220;Ask Expert&#8221; feature takes a different approach: after its iterative Deep Research process identifies relevant papers, you can ask follow-up questions. </p><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!NrjK!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa03e886c-1bc5-4514-ac05-2073ad29aeb6_806x504.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!NrjK!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa03e886c-1bc5-4514-ac05-2073ad29aeb6_806x504.png 424w, https://substackcdn.com/image/fetch/$s_!NrjK!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa03e886c-1bc5-4514-ac05-2073ad29aeb6_806x504.png 848w, https://substackcdn.com/image/fetch/$s_!NrjK!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa03e886c-1bc5-4514-ac05-2073ad29aeb6_806x504.png 1272w, https://substackcdn.com/image/fetch/$s_!NrjK!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa03e886c-1bc5-4514-ac05-2073ad29aeb6_806x504.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!NrjK!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa03e886c-1bc5-4514-ac05-2073ad29aeb6_806x504.png" width="806" height="504" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/a03e886c-1bc5-4514-ac05-2073ad29aeb6_806x504.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:504,&quot;width&quot;:806,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:68885,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/185621087?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa03e886c-1bc5-4514-ac05-2073ad29aeb6_806x504.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!NrjK!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa03e886c-1bc5-4514-ac05-2073ad29aeb6_806x504.png 424w, https://substackcdn.com/image/fetch/$s_!NrjK!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa03e886c-1bc5-4514-ac05-2073ad29aeb6_806x504.png 848w, https://substackcdn.com/image/fetch/$s_!NrjK!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa03e886c-1bc5-4514-ac05-2073ad29aeb6_806x504.png 1272w, https://substackcdn.com/image/fetch/$s_!NrjK!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa03e886c-1bc5-4514-ac05-2073ad29aeb6_806x504.png 1456w" sizes="100vw" 
loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Notably, for questions like &#8220;Predict future trends,&#8221; the system can search the general web in addition to the papers already found in the academic corpus (Semantic Scholar)&#8212;a sensible design choice since trend prediction often requires non-academic sources. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!RXos!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F67500388-cf97-4b26-b0a5-b77ef24f7185_1135x377.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!RXos!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F67500388-cf97-4b26-b0a5-b77ef24f7185_1135x377.png 424w, https://substackcdn.com/image/fetch/$s_!RXos!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F67500388-cf97-4b26-b0a5-b77ef24f7185_1135x377.png 848w, https://substackcdn.com/image/fetch/$s_!RXos!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F67500388-cf97-4b26-b0a5-b77ef24f7185_1135x377.png 1272w, https://substackcdn.com/image/fetch/$s_!RXos!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F67500388-cf97-4b26-b0a5-b77ef24f7185_1135x377.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!RXos!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F67500388-cf97-4b26-b0a5-b77ef24f7185_1135x377.png" width="1135" height="377" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/67500388-cf97-4b26-b0a5-b77ef24f7185_1135x377.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:377,&quot;width&quot;:1135,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:35949,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/185621087?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F67500388-cf97-4b26-b0a5-b77ef24f7185_1135x377.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!RXos!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F67500388-cf97-4b26-b0a5-b77ef24f7185_1135x377.png 424w, https://substackcdn.com/image/fetch/$s_!RXos!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F67500388-cf97-4b26-b0a5-b77ef24f7185_1135x377.png 848w, https://substackcdn.com/image/fetch/$s_!RXos!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F67500388-cf97-4b26-b0a5-b77ef24f7185_1135x377.png 1272w, https://substackcdn.com/image/fetch/$s_!RXos!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F67500388-cf97-4b26-b0a5-b77ef24f7185_1135x377.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p> </p><h2>Why Multi-Document Summarisation Is Hard</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!frlA!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2d1c4e4-6d08-46c8-afba-aa23fabf4ef2_1669x496.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!frlA!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2d1c4e4-6d08-46c8-afba-aa23fabf4ef2_1669x496.png 424w, 
https://substackcdn.com/image/fetch/$s_!frlA!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2d1c4e4-6d08-46c8-afba-aa23fabf4ef2_1669x496.png 848w, https://substackcdn.com/image/fetch/$s_!frlA!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2d1c4e4-6d08-46c8-afba-aa23fabf4ef2_1669x496.png 1272w, https://substackcdn.com/image/fetch/$s_!frlA!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2d1c4e4-6d08-46c8-afba-aa23fabf4ef2_1669x496.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!frlA!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2d1c4e4-6d08-46c8-afba-aa23fabf4ef2_1669x496.png" width="1456" height="433" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/a2d1c4e4-6d08-46c8-afba-aa23fabf4ef2_1669x496.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:433,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:76736,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/185621087?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2d1c4e4-6d08-46c8-afba-aa23fabf4ef2_1669x496.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!frlA!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2d1c4e4-6d08-46c8-afba-aa23fabf4ef2_1669x496.png 424w, https://substackcdn.com/image/fetch/$s_!frlA!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2d1c4e4-6d08-46c8-afba-aa23fabf4ef2_1669x496.png 848w, https://substackcdn.com/image/fetch/$s_!frlA!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2d1c4e4-6d08-46c8-afba-aa23fabf4ef2_1669x496.png 1272w, https://substackcdn.com/image/fetch/$s_!frlA!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2d1c4e4-6d08-46c8-afba-aa23fabf4ef2_1669x496.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" 
stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This category is difficult for at least three compounding reasons:</p><ol><li><p><strong>Retrieval quality</strong> &#8212; You need the right, relevant documents. Without them, nothing downstream works.</p></li><li><p><strong>Accurate contextual summarisation </strong>&#8212; Each document must be summarised correctly in relation to the query. Errors here propagate into the synthesis.</p></li><li><p><strong>Evidence assessment and contradiction handling</strong> &#8212; This is arguably the hardest problem. How do you correctly assess the quality and strength of evidence across documents, particularly when they contradict each other? LLMs tend to be credulous&#8212;they treat retrieved content as equally authoritative regardless of study design, sample size, or methodological rigour. This is improving with stronger models, but remains a fundamental limitation.</p></li></ol><p>There has been worry about RAG-enabled LLMs happily citing retracted work. To be fair, humans do this too. The solution requires ensuring LLMs have access to updated indexes with retraction information (or perform real-time checks) and that models understand what retraction status means.</p><h2>Evaluating Summarisation Quality</h2><p>A taxonomy is only useful if it helps us assess tools. 
Here&#8217;s the uncomfortable truth: robust evaluation of LLM summarisation remains an unsolved problem, and the difficulty scales with each category.</p><h3>Five practical checks Librarians can try</h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Joqm!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcc77923c-21af-4cd2-b2d2-4a74d3765840_2752x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Joqm!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcc77923c-21af-4cd2-b2d2-4a74d3765840_2752x1536.png 424w, https://substackcdn.com/image/fetch/$s_!Joqm!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcc77923c-21af-4cd2-b2d2-4a74d3765840_2752x1536.png 848w, https://substackcdn.com/image/fetch/$s_!Joqm!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcc77923c-21af-4cd2-b2d2-4a74d3765840_2752x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!Joqm!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcc77923c-21af-4cd2-b2d2-4a74d3765840_2752x1536.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Joqm!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcc77923c-21af-4cd2-b2d2-4a74d3765840_2752x1536.png" width="1456" height="813" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/cc77923c-21af-4cd2-b2d2-4a74d3765840_2752x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:813,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:6635663,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/185621087?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcc77923c-21af-4cd2-b2d2-4a74d3765840_2752x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Joqm!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcc77923c-21af-4cd2-b2d2-4a74d3765840_2752x1536.png 424w, https://substackcdn.com/image/fetch/$s_!Joqm!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcc77923c-21af-4cd2-b2d2-4a74d3765840_2752x1536.png 848w, https://substackcdn.com/image/fetch/$s_!Joqm!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcc77923c-21af-4cd2-b2d2-4a74d3765840_2752x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!Joqm!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcc77923c-21af-4cd2-b2d2-4a74d3765840_2752x1536.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Robust evaluation of LLM summarisation is still an active research area<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-5" href="#footnote-5" target="_self">5</a>. But librarians don&#8217;t need perfect metrics to run useful, repeatable checks. Here are five practical &#8220;sanity tests&#8221; for each category&#8212;lightweight enough to do routinely, but strong enough to surface the common failure modes.</p><blockquote><p>Tip 1: Because these systems are often non-deterministic, you should consider running each test 3&#8211;5 times!</p></blockquote><h4><strong> Category 1: Single-document summarisation (1a / 1b / 1c)</strong></h4><ol><li><p><strong>Stability / repeatability test</strong><br>Run the same document + same button/prompt 3&#8211;5 times. 
If key claims change materially between runs, treat the feature as inherently non-deterministic and harder to trust.</p></li><li><p><strong>Factual grounding spot-check</strong><br>Pick 5&#8211;10 concrete statements from the output (numbers, causal claims, named entities, &#8220;the study found&#8230;&#8221;). Verify each directly against the source text.</p></li><li><p><strong>Quote-and-page verification</strong><br>For each key claim, ask: can a user find the supporting passage quickly? If the UI provides snippets, check whether they actually support the claim (not just vaguely relate).</p></li><li><p><strong>Negative-control question (especially for 1c)</strong><br>Ask something you know is <em>not</em> in the document (&#8220;Does this paper report a randomized controlled trial?&#8221; when it doesn&#8217;t). The best behaviour is &#8220;not mentioned / not in the source,&#8221; not confident invention.</p></li><li><p><strong>Scope test</strong><br>Check what&#8217;s being summarised: abstract-only vs full text; for ebooks, chapter vs entire book. If scope is unclear, outputs are hard to interpret and easy to over-trust.</p></li></ol><h4>Category 2: Sequential single-document summarisation (synthesis tables / extraction columns)</h4><ol><li><p><strong>Relevance sensitivity test</strong><br>Use a query where only some retrieved papers are truly relevant. See whether the per-paper summaries make irrelevance obvious (e.g., summaries that can&#8217;t answer the question should look &#8220;off&#8221;).</p></li><li><p><strong>Extraction accuracy audit (sample-based)</strong><br>For any structured column (sample size, method, population, outcome), randomly audit 10&#8211;20 rows against the PDFs. 
Report an error rate; this becomes your baseline.</p></li><li><p><strong>Consistency across papers</strong><br>Check whether the system uses consistent definitions and units across rows (e.g., &#8220;n=&#8221; always means sample size; outcomes aren&#8217;t silently rephrased into different constructs).</p></li><li><p><strong>Missingness honesty</strong><br>When information is absent or unclear in a paper, does the tool leave it blank / mark &#8220;not reported,&#8221; or does it fill with plausible-sounding guesses?</p></li><li><p><strong>Provenance per cell</strong><br>For each extracted/summarised cell, can the system show the supporting excerpt? If not, every table becomes a manual scavenger hunt (and a trust sink).</p></li></ol><h4>Category 3: Query-based multi-document summarisation (RAG answers / synthesis across papers)</h4><ol><li><p><strong>Attribution test (claim &#8594; source mapping)</strong><br>Take 5&#8211;10 substantive claims in the answer. For each, verify that (a) a citation is provided, and (b) the cited source actually supports the claim.</p></li><li><p><strong>Coverage test (known-key-paper set)</strong><br>Use a question where you know the &#8220;must-cite&#8221; papers. Does the system retrieve and use them? </p></li><li><p><strong>Contradiction test</strong><br>Deliberately use a topic with well-known conflicting results (or seed a small set of papers with disagreement). Check whether the answer acknowledges disagreement and characterises it accurately, rather than smoothing it away<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-6" href="#footnote-6" target="_self">6</a>.</p></li><li><p><strong>&#8220;Not in the sources&#8221; also known as negative rejection test</strong><br>Ask a question that cannot be answered from the retrieved set. 
Good systems will say so, ask to broaden retrieval, or qualify strongly&#8212;not hallucinate<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-7" href="#footnote-7" target="_self">7</a>.</p></li><li><p><strong>Retraction / correction test</strong><br>Seed a retracted paper (or a paper with an expression of concern) alongside later work. Check whether the system flags status appropriately and avoids treating retracted findings as live evidence<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-8" href="#footnote-8" target="_self">8</a>.</p></li></ol><p>An alternative idea I have been toying with is formally adapting <a href="https://harzing.com/blog/2016/04/are-referencing-errors-undermining-our-scholarship-and-credibility">Harzing&#8217;s 12 guidelines for academic referencing (last updated in 2001 and designed purely for humans) as a standard to assess RAG output.</a></p><blockquote><p>Tip 2: Traditionally, LLMs have a strong bias to answer even when they shouldn&#8217;t. As such, if you have time for only one test, it is worth testing how they react to &#8220;null answers or results&#8221; to check for false positives/hallucinations &#8212; basically 1.4, 2.1, 2.4, 3.4.</p><p>Tip 3: Take note of examples or scenarios where these tools fail. 
It is highly likely these are good scenarios to reuse.</p></blockquote><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!aO47!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7000716-66a5-4142-931c-24fffb457799_721x459.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!aO47!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7000716-66a5-4142-931c-24fffb457799_721x459.png 424w, https://substackcdn.com/image/fetch/$s_!aO47!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7000716-66a5-4142-931c-24fffb457799_721x459.png 848w, https://substackcdn.com/image/fetch/$s_!aO47!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7000716-66a5-4142-931c-24fffb457799_721x459.png 1272w, https://substackcdn.com/image/fetch/$s_!aO47!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7000716-66a5-4142-931c-24fffb457799_721x459.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!aO47!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7000716-66a5-4142-931c-24fffb457799_721x459.png" width="721" height="459" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c7000716-66a5-4142-931c-24fffb457799_721x459.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:459,&quot;width&quot;:721,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:27464,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/185621087?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7000716-66a5-4142-931c-24fffb457799_721x459.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!aO47!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7000716-66a5-4142-931c-24fffb457799_721x459.png 424w, https://substackcdn.com/image/fetch/$s_!aO47!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7000716-66a5-4142-931c-24fffb457799_721x459.png 848w, https://substackcdn.com/image/fetch/$s_!aO47!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7000716-66a5-4142-931c-24fffb457799_721x459.png 1272w, https://substackcdn.com/image/fetch/$s_!aO47!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc7000716-66a5-4142-931c-24fffb457799_721x459.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2>Conclusion</h2><p>Not all &#8220;summaries&#8221; are created equal. Treating AI summarisation as a monolithic capability is a mistake. There is a world of difference between a pre-canned summary of a single article (Fixed Button) and a dynamic synthesis of conflicting claims across twenty papers (Query-based Multi-Document Summarisation).</p><p>For librarians and researchers, understanding this taxonomy is crucial for information literacy instruction and tool evaluation. A fixed, single-document summary is relatively safe but limited&#8212;essentially a glorified abstract. 
As we move into dynamic, multi-document RAG, utility increases substantially, but so does complexity and error potential.</p><p> </p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me coffee&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me coffee</span></a></p><div class="captioned-button-wrap" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/classifying-the-ways-llms-summarise?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="CaptionedButtonToDOM"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! This post is public so feel free to share it.</p></div><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/p/classifying-the-ways-llms-summarise?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://aarontay.substack.com/p/classifying-the-ways-llms-summarise?utm_source=substack&utm_medium=email&utm_content=share&action=share"><span>Share</span></a></p></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-1" href="#footnote-anchor-1" class="footnote-number" contenteditable="false" target="_self">1</a><div class="footnote-content"><p>There is also a distinction between extractive summarisation (selecting and copying verbatim sentences from the source) and abstractive summarisation (generating novel text that paraphrases and synthesises). 
With LLMs, abstractive summarisation is now the dominant approach.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-2" href="#footnote-anchor-2" class="footnote-number" contenteditable="false" target="_self">2</a><div class="footnote-content"><p>Not all features mentioned are generated directly with LLMs. For example, the generated mindmaps from &#8220;Visualise Topics&#8221; in ProQuest Research Assistant likely use the LLM to call traditional clustering tools rather than generating visualisations directly.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-3" href="#footnote-anchor-3" class="footnote-number" contenteditable="false" target="_self">3</a><div class="footnote-content"><p>Deep Research mostly combines category 3 with iterative retrieval and self-checking&#8212;a topic for a future post.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-4" href="#footnote-anchor-4" class="footnote-number" contenteditable="false" target="_self">4</a><div class="footnote-content"><p>This is an &#8220;answer&#8221; rather than a &#8220;summarization&#8221; because it is generated in response to the user&#8217;s search query.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-5" href="#footnote-anchor-5" class="footnote-number" contenteditable="false" target="_self">5</a><div class="footnote-content"><p>I have a series of blog posts in draft on this complicated topic!</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-6" href="#footnote-anchor-6" class="footnote-number" contenteditable="false" target="_self">6</a><div class="footnote-content"><p>Should the generated answer &#8220;play favourites&#8221; and suggest certain papers are more prestigious and hence the claims should be taken more seriously? 
Or should they be even-handed, just addressing the claims in each paper equally?</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-7" href="#footnote-anchor-7" class="footnote-number" contenteditable="false" target="_self">7</a><div class="footnote-content"><p>This is traditionally the hardest test for RAG systems to pass. Worth trying!</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-8" href="#footnote-anchor-8" class="footnote-number" contenteditable="false" target="_self">8</a><div class="footnote-content"><p>This is often highly dependent on the source - whether it has up-to-date information about retraction status and whether it is fed to the LLM.</p></div></div>]]></content:encoded></item><item><title><![CDATA[The Blank Box Problem: Why It's Harder Than Ever to Know What to Type Into an AI Search Bar]]></title><description><![CDATA[We&#8217;ve traded keyword constraints for infinite potential, and created a massive usability crisis in the process.]]></description><link>https://aarontay.substack.com/p/the-blank-box-problem-why-its-harder</link><guid isPermaLink="false">https://aarontay.substack.com/p/the-blank-box-problem-why-its-harder</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Sat, 10 Jan 2026 18:25:59 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!O2xq!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3a579c34-bf8a-4e82-980f-1405754de6f4_1024x559.jpeg" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!O2xq!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3a579c34-bf8a-4e82-980f-1405754de6f4_1024x559.jpeg" data-component-name="Image2ToDOM"><div 
class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!O2xq!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3a579c34-bf8a-4e82-980f-1405754de6f4_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!O2xq!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3a579c34-bf8a-4e82-980f-1405754de6f4_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!O2xq!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3a579c34-bf8a-4e82-980f-1405754de6f4_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!O2xq!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3a579c34-bf8a-4e82-980f-1405754de6f4_1024x559.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!O2xq!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3a579c34-bf8a-4e82-980f-1405754de6f4_1024x559.jpeg" width="1024" height="559" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/3a579c34-bf8a-4e82-980f-1405754de6f4_1024x559.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:138377,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/181104601?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3a579c34-bf8a-4e82-980f-1405754de6f4_1024x559.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!O2xq!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3a579c34-bf8a-4e82-980f-1405754de6f4_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!O2xq!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3a579c34-bf8a-4e82-980f-1405754de6f4_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!O2xq!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3a579c34-bf8a-4e82-980f-1405754de6f4_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!O2xq!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3a579c34-bf8a-4e82-980f-1405754de6f4_1024x559.jpeg 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" 
width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>TLDR: There is a single, blinking cursor that defines our modern interaction with information. It sits in an empty rectangular box, waiting.</p><p>For two decades, search interfaces had clear affordances. Boolean operators, date filters, and &#8220;Advanced Search&#8221; screens signaled exactly what a database could and couldn&#8217;t do.</p><p>The new era of Agentic AI search has traded these constraints for infinite potential, replacing the dashboard with a blank text box. But this minimalism is deceptive. It has created a massive usability crisis I call the Blank Box Problem, trapping users in a double bind:</p><ul><li><p><strong>Input Ambiguity:</strong> We don&#8217;t know how to speak to the machine (Keywords vs. Natural Language vs. 
Engineered Prompts).</p></li><li><p><strong>Capability Ambiguity:</strong> We don&#8217;t know what the machine can actually <em>do</em> with our words (Search / Filter / Agentic tasks).</p></li></ul><p></p><h3>Introduction</h3><p>Traditional academic search interfaces were rich in affordances: Boolean operators signalled combinatorial logic, field codes revealed searchable metadata, dropdown menus exposed available filters, and facets signalled post-filter options. <em><a href="https://aarontay.substack.com/p/how-agentic-are-academic-deep-research">Most importantly, nobody in their right mind would expect it to act like a research assistant and try asking it to perform tasks requiring a complicated series of operations.</a></em></p><p>Then came ChatGPT, Perplexity, and the new era of agentic AI search. The boxes look the same, but the rules of engagement have shattered. The promise is seductive: we can now tell the AI search engine exactly what we want without pressing buttons or learning syntax.</p><p>We now face a usability crisis: we no longer know what to input into the search bar because the &#8220;Blank Box&#8221; hides the mechanics of the machine. Worse, we are caught in a Double Ambiguity:</p><ul><li><p><strong>Input Ambiguity:</strong> We don&#8217;t know how to speak to the machine (Keywords vs. Natural Language vs. Prompts).</p></li><li><p><strong>Capability Ambiguity:</strong> We don&#8217;t know what the machine can actually <em>do</em> with our words (Search vs. Filter vs. Agentic tasks).</p></li></ul><p>As I noted in <a href="https://aarontay.substack.com/p/what-do-we-actually-mean-by-ai-powered">my last blog post, vague use of terms like &#8220;AI-powered search engines&#8221; fuels this confusion</a>.</p><p>There&#8217;s a certain irony here. For decades, librarians lamented that users didn&#8217;t understand Boolean operators, truncation symbols, or field codes  (or just didn&#8217;t care to use facets). 
Now we&#8217;ve built systems that accept natural language&#8212;and users are more confused than ever about what they can actually do.</p><p>  </p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me Coffee!&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me Coffee!</span></a></p><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!s8bX!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff52aaa0c-0b11-4d9c-accd-a8b80cb41277_2752x1536.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!s8bX!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff52aaa0c-0b11-4d9c-accd-a8b80cb41277_2752x1536.png 424w, https://substackcdn.com/image/fetch/$s_!s8bX!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff52aaa0c-0b11-4d9c-accd-a8b80cb41277_2752x1536.png 848w, https://substackcdn.com/image/fetch/$s_!s8bX!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff52aaa0c-0b11-4d9c-accd-a8b80cb41277_2752x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!s8bX!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff52aaa0c-0b11-4d9c-accd-a8b80cb41277_2752x1536.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!s8bX!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff52aaa0c-0b11-4d9c-accd-a8b80cb41277_2752x1536.png" width="1456" height="813" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f52aaa0c-0b11-4d9c-accd-a8b80cb41277_2752x1536.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:813,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:5999142,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/181104601?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff52aaa0c-0b11-4d9c-accd-a8b80cb41277_2752x1536.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!s8bX!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff52aaa0c-0b11-4d9c-accd-a8b80cb41277_2752x1536.png 424w, https://substackcdn.com/image/fetch/$s_!s8bX!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff52aaa0c-0b11-4d9c-accd-a8b80cb41277_2752x1536.png 848w, https://substackcdn.com/image/fetch/$s_!s8bX!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff52aaa0c-0b11-4d9c-accd-a8b80cb41277_2752x1536.png 1272w, https://substackcdn.com/image/fetch/$s_!s8bX!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff52aaa0c-0b11-4d9c-accd-a8b80cb41277_2752x1536.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p></p><h3>Part 1: Input Ambiguity</h3><p><em>Do I talk like a caveman, a human, or a Sorcerer?</em></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!aa-s!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7833bf21-755b-4287-b367-77cec8aa8e00_1024x559.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" 
srcset="https://substackcdn.com/image/fetch/$s_!aa-s!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7833bf21-755b-4287-b367-77cec8aa8e00_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!aa-s!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7833bf21-755b-4287-b367-77cec8aa8e00_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!aa-s!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7833bf21-755b-4287-b367-77cec8aa8e00_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!aa-s!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7833bf21-755b-4287-b367-77cec8aa8e00_1024x559.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!aa-s!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7833bf21-755b-4287-b367-77cec8aa8e00_1024x559.jpeg" width="1024" height="559" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/7833bf21-755b-4287-b367-77cec8aa8e00_1024x559.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:192483,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/181104601?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7833bf21-755b-4287-b367-77cec8aa8e00_1024x559.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" 
class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!aa-s!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7833bf21-755b-4287-b367-77cec8aa8e00_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!aa-s!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7833bf21-755b-4287-b367-77cec8aa8e00_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!aa-s!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7833bf21-755b-4287-b367-77cec8aa8e00_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!aa-s!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7833bf21-755b-4287-b367-77cec8aa8e00_1024x559.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" 
stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>For twenty years, we were trained when using academic databases<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-1" href="#footnote-1" target="_self">1</a> to speak a specific pidgin language: &#8220;keyword search&#8221;. We stripped away grammar (e.g., &#8220;of&#8221;), articles (e.g., &#8220;the&#8221;), and politeness<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-2" href="#footnote-2" target="_self">2</a>. We didn&#8217;t ask, &#8220;<code>Is there an open access citation advantage</code>&#8221;. Instead we just typed: <code>open access citation advantage.</code> It was unnatural, but it was deterministic. We knew that if we typed X, the machine would look for X. </p><p>Now, <a href="https://aarontay.substack.com/p/why-embedding-vector-search-is-probably">the rise of  &#8220;AI search&#8221;  or semantic search</a> suggests we might want or need to use other modes, but at this stage of transition it is hard to know when to abandon keyword search.  </p><p>The current state of AI search forces users to gamble on three different input modes, often with no indication of which triggers the best results:</p><ol><li><p><strong>The Caveman (Keyword Search)</strong><a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-3" href="#footnote-3" target="_self">3</a><strong>: </strong>The old reliable. 
Predictable, and typically more precise the longer the query, but it may often fall prey to the &#8220;<a href="https://en.wikipedia.org/wiki/Vocabulary_mismatch">vocabulary mismatch problem</a>&#8221;.</p></li><li><p><strong>The Colleague (Natural Language): </strong>The promise of &#8220;ask me anything.&#8221; You talk to the AI like a colleague. But does it understand complex intent, or is it just dropping stop words and extracting keywords from your sentence?</p></li><li><p><strong>The Sorcerer (Prompt Engineering): </strong>The magic incantations. To extract value, we are told we must provide context, personas, constraints and <a href="https://arxiv.org/abs/2312.16171">even weird incentives</a> that supposedly help the black box of an LLM, e.g. &#8220;Act as a senior bibliometrician and find...I will give you $500 if you do well&#8221;</p></li></ol><blockquote><p>Because the interface is opaque, users might be developing folk theories about how to make it work. We add phrases like <a href="https://arxiv.org/abs/2201.11903">&#8220;take a deep breath&#8221; or &#8220;think step-by-step&#8221; not because we understand the system architecture, but because we hear it works well with GPT-3.5 or other old models</a> - not caring that some of this advice is outdated with reasoning models and, more importantly, that academic AI search is a complicated system of different parts, not just an LLM. We have moved from the deterministic logic of Boolean operators to the almost superstitious rituals of Prompt Engineering.</p></blockquote><p>Each mode carries different assumptions about how the system processes input. Keywords assume something like traditional information retrieval&#8212;matching terms, perhaps with query expansion. Natural language assumes the system understands semantic intent via embeddings. 
Prompt engineering assumes the system can follow complex instructions, maintain context, and execute multi-constraint searches.</p><p>The core problem is architectural opacity - users have no way to know which mode a given system expects or handles best. A system optimised for keyword matching may perform poorly with verbose natural language prompts. A system designed for conversational queries or one having limited capabilities (see later) may strip out or rewrite carefully crafted constraints. Users may sometimes learn this only through failed searches and inconsistent results<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-4" href="#footnote-4" target="_self">4</a>. </p><p></p><h3>This isn&#8217;t an abstract concern</h3><p>Choosing the wrong input mode for a given system can meaningfully degrade results.</p><p>Semantic Scholar is a case in point. As <a href="https://aarontay.substack.com/p/what-do-we-actually-mean-by-ai-powered#:~:text=The%20%E2%80%9CSemantic%20Scholar%E2%80%9D%20Confusion">I showed in my last blog post</a>, despite the name, its primary retrieval is lexical, not semantic. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!WbvB!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdc40f95a-89e4-4040-9c3c-83b383d5586d_825x1024.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!WbvB!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdc40f95a-89e4-4040-9c3c-83b383d5586d_825x1024.jpeg 424w, https://substackcdn.com/image/fetch/$s_!WbvB!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdc40f95a-89e4-4040-9c3c-83b383d5586d_825x1024.jpeg 848w, https://substackcdn.com/image/fetch/$s_!WbvB!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdc40f95a-89e4-4040-9c3c-83b383d5586d_825x1024.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!WbvB!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdc40f95a-89e4-4040-9c3c-83b383d5586d_825x1024.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!WbvB!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdc40f95a-89e4-4040-9c3c-83b383d5586d_825x1024.jpeg" width="728" height="903.6024242424243" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/dc40f95a-89e4-4040-9c3c-83b383d5586d_825x1024.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:false,&quot;imageSize&quot;:&quot;normal&quot;,&quot;height&quot;:1024,&quot;width&quot;:825,&quot;resizeWidth&quot;:728,&quot;bytes&quot;:68587,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/181104601?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdc40f95a-89e4-4040-9c3c-83b383d5586d_825x1024.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:&quot;center&quot;,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!WbvB!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdc40f95a-89e4-4040-9c3c-83b383d5586d_825x1024.jpeg 424w, https://substackcdn.com/image/fetch/$s_!WbvB!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdc40f95a-89e4-4040-9c3c-83b383d5586d_825x1024.jpeg 848w, https://substackcdn.com/image/fetch/$s_!WbvB!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdc40f95a-89e4-4040-9c3c-83b383d5586d_825x1024.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!WbvB!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdc40f95a-89e4-4040-9c3c-83b383d5586d_825x1024.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container 
restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p><a href="https://arxiv.org/abs/2301.10140">Semantic Scholar&#8217;s primary retrieval pipeline when you search on the website</a></p><p>If you query it with natural language sentences expecting embedding-based retrieval, you&#8217;ll miss most of the relevant literature compared to a keyword search without stop words.</p><p>The example below shows that treating Semantic Scholar like a natural language search engine returns only 13 results, missing a ton of relevant results compared to a keyword search.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" 
href="https://substackcdn.com/image/fetch/$s_!-Ot_!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!-Ot_!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 424w, https://substackcdn.com/image/fetch/$s_!-Ot_!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 848w, https://substackcdn.com/image/fetch/$s_!-Ot_!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 1272w, https://substackcdn.com/image/fetch/$s_!-Ot_!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!-Ot_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png" width="1190" height="304" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/cf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:304,&quot;width&quot;:1190,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!-Ot_!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 424w, https://substackcdn.com/image/fetch/$s_!-Ot_!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 848w, https://substackcdn.com/image/fetch/$s_!-Ot_!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 1272w, https://substackcdn.com/image/fetch/$s_!-Ot_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Conversely, using &#8220;Caveman&#8221; keywords on a system designed for agentic reasoning (like the new Deep Research tools) might not be a total disaster but wastes the machine&#8217;s potential to understand nuance and counter-arguments.</p><p>If you read all this and are confused (you are not an information retrieval engineer!), you can be sure your users are too.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! 
Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><h2>Part 2: Capability Ambiguity</h2><p>Even if we figure out how to ask, we hit a second wall: we don&#8217;t know what the system can actually do (Capability Ambiguity). When an AI search fails to deliver what users expect, the failure can occur in three distinct ways&#8212;and the AI blank box provides no way to determine which.</p><h3>1. Retrieval Abstraction: Similarity Spectrum vs Buckets</h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!h386!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F86bec1c7-3194-46f0-ae74-5e1e3bdd675f_1024x565.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!h386!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F86bec1c7-3194-46f0-ae74-5e1e3bdd675f_1024x565.jpeg 424w, https://substackcdn.com/image/fetch/$s_!h386!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F86bec1c7-3194-46f0-ae74-5e1e3bdd675f_1024x565.jpeg 848w, https://substackcdn.com/image/fetch/$s_!h386!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F86bec1c7-3194-46f0-ae74-5e1e3bdd675f_1024x565.jpeg 1272w, 
https://substackcdn.com/image/fetch/$s_!h386!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F86bec1c7-3194-46f0-ae74-5e1e3bdd675f_1024x565.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!h386!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F86bec1c7-3194-46f0-ae74-5e1e3bdd675f_1024x565.jpeg" width="1024" height="565" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/86bec1c7-3194-46f0-ae74-5e1e3bdd675f_1024x565.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:565,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:110588,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/181104601?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F86bec1c7-3194-46f0-ae74-5e1e3bdd675f_1024x565.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!h386!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F86bec1c7-3194-46f0-ae74-5e1e3bdd675f_1024x565.jpeg 424w, https://substackcdn.com/image/fetch/$s_!h386!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F86bec1c7-3194-46f0-ae74-5e1e3bdd675f_1024x565.jpeg 848w, 
https://substackcdn.com/image/fetch/$s_!h386!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F86bec1c7-3194-46f0-ae74-5e1e3bdd675f_1024x565.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!h386!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F86bec1c7-3194-46f0-ae74-5e1e3bdd675f_1024x565.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Search relevance engineer Doug Turnbull <a 
href="https://softwaredoug.com/blog/2025/12/09/rag-users-want-affordances-not-vectors">has argued</a> that the AI search industry fundamentally misframed the problem by building around vector similarity alone. Because users interact with LLMs in natural language, developers assumed the underlying retrieval should also use natural language similarity&#8212;encoding queries as embeddings and finding semantically similar passages on a spectrum.</p><p>But this is not always the right abstraction. Users don't only want semantic similarity. They often want what Turnbull calls <strong>selectors, or what you can think of as binary buckets</strong>&#8212;structured filters on specific binary attributes. When a researcher asks for &#8220;peer-reviewed papers on CRISPR ethics published after 2020,&#8221; they're expressing a query with clear selectors: document type (peer-reviewed papers), topic (CRISPR ethics), date range (post-2020). They expect the system to filter on these attributes or buckets, not merely find passages that are "close" in some abstract embedding space.</p><p>Some academic AI search tools&#8212;particularly earlier versions of Elicit<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-5" href="#footnote-5" target="_self">5</a>&#8212;relied heavily on vector embeddings for retrieval and ranking with no way to apply pre-filters. </p><p>So why not combine vector embedding retrieval with hard filtering? 
The issue is that <a href="https://weaviate.io/blog/speed-up-filtered-vector-search">combining top-K vector search with attribute filtering (e.g., filtered HNSW) is technically difficult</a>, though <a href="https://www.elastic.co/search-labs/blog/filtered-hnsw-knn-search">newer techniques like ACORN are making it more tractable</a><a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-6" href="#footnote-6" target="_self">6</a><a href="https://www.elastic.co/search-labs/blog/filtered-hnsw-knn-search">.</a> </p><p>Today, some AI search tools like Consensus and Elicit offer numerous pre-filter options, while others like <a href="https://knowledge.exlibrisgroup.com/Primo/Product_Documentation/020Primo_VE/Primo_VE_(English)/015_Getting_Started_with_Primo_Research_Assistant">Primo Research Assistant</a> and <a href="https://www.elsevier.com/products/scopus/scopus-ai">Scopus AI </a>offer far fewer filter options than their &#8220;parent&#8221; non-AI search indexes.</p><p>When a user is faced with a blank chat box with no affordances like pre-filter checkboxes or checklists, how are they to know whether they can ask in natural language to filter by, say, publication year? </p><p>What I can say is that if you assume the lack of affordances means the system can&#8217;t do any filtering, this is not always true. 
</p><p>For example, <em>in Undermind.ai, it can get you papers by publication year by natural language querying but it cannot filter reliably by publication type due to the fact that the underlying index (Semantic Scholar) does not even have this metadata value.</em></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!02rl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4e5b5df2-3b2c-4228-a466-53763eb69a77_1024x765.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!02rl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4e5b5df2-3b2c-4228-a466-53763eb69a77_1024x765.jpeg 424w, https://substackcdn.com/image/fetch/$s_!02rl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4e5b5df2-3b2c-4228-a466-53763eb69a77_1024x765.jpeg 848w, https://substackcdn.com/image/fetch/$s_!02rl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4e5b5df2-3b2c-4228-a466-53763eb69a77_1024x765.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!02rl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4e5b5df2-3b2c-4228-a466-53763eb69a77_1024x765.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!02rl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4e5b5df2-3b2c-4228-a466-53763eb69a77_1024x765.jpeg" width="1024" height="765" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4e5b5df2-3b2c-4228-a466-53763eb69a77_1024x765.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:765,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:171221,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/181104601?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4e5b5df2-3b2c-4228-a466-53763eb69a77_1024x765.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!02rl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4e5b5df2-3b2c-4228-a466-53763eb69a77_1024x765.jpeg 424w, https://substackcdn.com/image/fetch/$s_!02rl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4e5b5df2-3b2c-4228-a466-53763eb69a77_1024x765.jpeg 848w, https://substackcdn.com/image/fetch/$s_!02rl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4e5b5df2-3b2c-4228-a466-53763eb69a77_1024x765.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!02rl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4e5b5df2-3b2c-4228-a466-53763eb69a77_1024x765.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Yet in both cases, Undermind will usually not warn you what you are asking for isn&#8217;t supported and try anyway to produce a result without an error message.</p><h3>2. 
Filter Recognition in natural language</h3><p>Even when a system&#8217;s basic search index does support structured constraints&#8212;date ranges, document types, citation thresholds&#8212;a separate question arises: does the natural language interpretation layer recognise when users are invoking them?</p><p>Consider common search constraints expressed naturally:</p><ul><li><p>&#8220;<em><strong>from 2000 to 2010</strong></em>&#8221; or &#8220;<em><strong>published in the last five years</strong></em>&#8221;</p></li><li><p>&#8220;<em><strong>sorted by most cited</strong></em>&#8221; or &#8220;<em><strong>most recent first</strong></em>&#8221;</p></li><li><p>&#8220;<em><strong>only peer-reviewed articles</strong></em>&#8221; or &#8220;<em><strong>excluding conference papers</strong></em>&#8221;</p></li><li><p>&#8220;<em><strong>English language only</strong></em>&#8221;</p></li><li><p>&#8220;<em><strong>open access articles</strong></em>&#8221;</p></li></ul><p>The underlying search infrastructure might even support all of these filters. But the natural language layer&#8212;the part that parses your query<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-7" href="#footnote-7" target="_self">7</a> and decides what to do with it&#8212;may or may not recognise these requests.</p><p>Consider a user entering a specific request like:</p><blockquote><p>&#8220;Show me <em><strong>peer-reviewed articles</strong></em> from <em><strong>2010 to 2015</strong></em> about machine learning, <em><strong>ordered by most cited</strong></em>.&#8221;</p></blockquote><p>This seems like a clear instruction. 
However, depending on which AI Research Assistant the user faces, the result is wildly different:</p><ul><li><p><strong>The &#8220;Deep Parser&#8221; (e.g., Web of Science Research Assistant):</strong> <a href="https://webofscience.zendesk.com/hc/en-us/articles/31437630410129-Web-of-Science-Research-Assistant#h_01JGKZH4M90REHBHPKARR2W4ZJ">This tool is built to understand a ton of specific metadata triggers (if a filter or sort option appears in Web of Science you can likely trigger it using natural language!</a>). It recognizes &#8220;2010-2015&#8221; not just as text, but as a command to apply a <strong>Publication Date Filter</strong>. It understands &#8220;ordered by most cited&#8221; as a specific <strong>Sort Function</strong>. The AI successfully translates this and many other filters from natural language into structured database queries.</p></li><li><p><strong>The &#8220;Surface Skimmer&#8221; (e.g., Primo Research Assistant):</strong> This tool might process the same query very differently despite being from the same company. <a href="https://knowledge.exlibrisgroup.com/Primo/Product_Documentation/020Primo_VE/Primo_VE_(English)/015_Getting_Started_with_Primo_Research_Assistant#:~:text=Research%20Questions%20Section-,Refined%20Search,the%20Online%20availability%20check%20box%20to%20filter%20your%20results%20by%20availability.,-Refined%20Search%20Options">It can actually &#8220;understand&#8221; and parse the input to set the publication year ranges, but does it know what &#8220;peer-reviewed&#8221; means as a metadata filter? (Spoiler: it does!) Or will it just look for the phrase &#8220;peer-reviewed&#8221; in the text? The user has no way of knowing.  Also, can it sort by citation counts? (Spoiler: it cannot.) 
</a></p></li></ul><p>More recently, <a href="https://knowledge.exlibrisgroup.com/Primo/Product_Documentation/020Primo_VE/Primo_VE_(English)/040Search_Configurations/Natural_Language_Search_in_the_NDE_UI">Primo NDE</a><a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-8" href="#footnote-8" target="_self">8</a><a href="https://knowledge.exlibrisgroup.com/Primo/Product_Documentation/020Primo_VE/Primo_VE_(English)/040Search_Configurations/Natural_Language_Search_in_the_NDE_UI"> introduced "natural language search"</a><strong>.</strong> Here's what it says </p><blockquote><p>The Natural Language Search feature enables users to formulate queries in normal spoken language, and automatically converts them into the structured format compatible with Primo&#8217;s Advanced Search. For example, the user could enter the query, &#8220;Find me US history journals in English that are available online,&#8221; and the system would create a query with the appropriate criteria for the search.</p></blockquote><p>So far, similar (use of LLM to translate to search strategy) to what we see in <a href="https://aarontay.substack.com/p/the-reproducibility-and">Web of Science Research Assistant, Primo Research Assistant</a>, <a href="https://aarontay.substack.com/p/a-deep-dive-into-ebscohosts-natural-4a6">EBSCO Natural Language Search</a> etc.</p><blockquote><p>Not only does the Natural Language Search generate queries from free text, it also identifies certain catch words in the text that can be used to define the scope and automatically select the appropriate filters for the search. For example, if the term &#8220;journal&#8221; appears in the text, the scope of the search is limited to journals<em>, </em>and if a language is specified, the language filter is automatically turned on.</p></blockquote><blockquote><p>The transformation of the original query into the structured format is performed using generative AI, via ChatGPT 4.1Mini. 
The elements of the query, such as resource types, date filters, full text preferences, language, and advanced fields like Title or Subject, are classified by the AI system, which uses this information to generate the basic Boolean query and then expands it using related concepts. Ambiguous inputs are handled intelligently by mapping to multiple fields (e.g., both Title and Subject) to ensure broad yet accurate retrieval.</p></blockquote><p>Ah, so it can recognise filters in your natural language query which is invoked by clicking on &#8220;Ask Anything&#8221; button.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!A_M6!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff6d4f496-1334-4fec-b291-e903735ff654_1427x872.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!A_M6!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff6d4f496-1334-4fec-b291-e903735ff654_1427x872.png 424w, https://substackcdn.com/image/fetch/$s_!A_M6!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff6d4f496-1334-4fec-b291-e903735ff654_1427x872.png 848w, https://substackcdn.com/image/fetch/$s_!A_M6!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff6d4f496-1334-4fec-b291-e903735ff654_1427x872.png 1272w, https://substackcdn.com/image/fetch/$s_!A_M6!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff6d4f496-1334-4fec-b291-e903735ff654_1427x872.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!A_M6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff6d4f496-1334-4fec-b291-e903735ff654_1427x872.png" width="1427" height="872" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f6d4f496-1334-4fec-b291-e903735ff654_1427x872.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:872,&quot;width&quot;:1427,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:85885,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/181104601?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff6d4f496-1334-4fec-b291-e903735ff654_1427x872.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!A_M6!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff6d4f496-1334-4fec-b291-e903735ff654_1427x872.png 424w, https://substackcdn.com/image/fetch/$s_!A_M6!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff6d4f496-1334-4fec-b291-e903735ff654_1427x872.png 848w, https://substackcdn.com/image/fetch/$s_!A_M6!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff6d4f496-1334-4fec-b291-e903735ff654_1427x872.png 1272w, https://substackcdn.com/image/fetch/$s_!A_M6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff6d4f496-1334-4fec-b291-e903735ff654_1427x872.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Here&#8217;s the problem. Which filters can you use purely by asking in natural language? You won&#8217;t know without tons of trial and error or <a href="https://knowledge.exlibrisgroup.com/Primo/Product_Documentation/020Primo_VE/Primo_VE_(English)/040Search_Configurations/Natural_Language_Search_in_the_NDE_UI#:~:text=Search%C2%A0checkbox.-,Special%20Terms,automatically%20apply%20filters%20and%20facets%20to%20the%20search%20results%2C%20as%20follows%3A,-Advanced%20search%20fields">reading the documentation</a>. 
</p><p>I would wager many people might think anything that is a filter in Primo NDE could be invoked by natural language queries. In fact, while a lot of filters and facets can be invoked this way (e.g. resource type, open access, available online, peer-reviewed, held by library, language, creator), some cannot (e.g. subject, collection, etc.).  </p><p>For example, <a href="https://bsky.app/profile/aarontay.bsky.social/post/3mbw4tvkpvc2n">while testing, I was initially encouraged by the fact that most of the filters in the Primo NDE instance I was testing could be invoked</a>&#8212;e.g. the following work correctly:</p><p>Find me <em><strong>open access</strong></em> papers on large language models  </p><p>Find me <em><strong>peer-reviewed</strong></em> papers on large language models  </p><p>Find me papers on large language models <em><strong>in Spanish</strong></em></p><p>Then I tried to invoke the Subject filter by trying</p><p>Find me papers on large language models in <em><strong>&lt;subject as per Primo NDE filter values&gt;</strong></em></p><p>or the sorting function</p><p>Find me papers on large language models and <em><strong>sort it by date-newest</strong></em><a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-9" href="#footnote-9" target="_self">9</a></p><p>But this time it would neither invoke the subject filter nor sort by date-newest. 
I then tried different variants of the query input, etc., to no avail, and I guess it probably wasn&#8217;t supported - but you could never be sure.</p><p>Of course, when <a href="https://knowledge.exlibrisgroup.com/Primo/Product_Documentation/020Primo_VE/Primo_VE_(English)/040Search_Configurations/Natural_Language_Search_in_the_NDE_UI#:~:text=Search%C2%A0checkbox.-,Special%20Terms,automatically%20apply%20filters%20and%20facets%20to%20the%20search%20results%2C%20as%20follows%3A,-Advanced%20search%20fields">you look at the documentation</a>, you realise it could never have worked as it wasn&#8217;t a supported type to filter on.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!sUVG!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe86556e3-cc77-4448-90ce-ce4dcc4f8ff6_1421x453.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!sUVG!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe86556e3-cc77-4448-90ce-ce4dcc4f8ff6_1421x453.png 424w, https://substackcdn.com/image/fetch/$s_!sUVG!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe86556e3-cc77-4448-90ce-ce4dcc4f8ff6_1421x453.png 848w, https://substackcdn.com/image/fetch/$s_!sUVG!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe86556e3-cc77-4448-90ce-ce4dcc4f8ff6_1421x453.png 1272w, https://substackcdn.com/image/fetch/$s_!sUVG!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe86556e3-cc77-4448-90ce-ce4dcc4f8ff6_1421x453.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!sUVG!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe86556e3-cc77-4448-90ce-ce4dcc4f8ff6_1421x453.png" width="1421" height="453" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/e86556e3-cc77-4448-90ce-ce4dcc4f8ff6_1421x453.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:453,&quot;width&quot;:1421,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:35357,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/181104601?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe86556e3-cc77-4448-90ce-ce4dcc4f8ff6_1421x453.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!sUVG!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe86556e3-cc77-4448-90ce-ce4dcc4f8ff6_1421x453.png 424w, https://substackcdn.com/image/fetch/$s_!sUVG!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe86556e3-cc77-4448-90ce-ce4dcc4f8ff6_1421x453.png 848w, https://substackcdn.com/image/fetch/$s_!sUVG!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe86556e3-cc77-4448-90ce-ce4dcc4f8ff6_1421x453.png 1272w, https://substackcdn.com/image/fetch/$s_!sUVG!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe86556e3-cc77-4448-90ce-ce4dcc4f8ff6_1421x453.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Because the interface is identical&#8212;an empty box&#8212;users cannot distinguish between a tool that respects metadata constraints and one <a href="https://aarontay.substack.com/p/the-case-of-the-vanishing-hit-count">that merely performs semantic fuzzy search and always returns the closest top K results even if it ignores the filter constraints.</a></p><p> </p><h3>3. 
Workflow Composition Problem</h3><p>The third point concerns what operations the system can perform and whether it can combine them.</p><p>Consider this research task: &#8220;Find me papers referenced by Article X, then identify related papers that could have been cited but weren&#8217;t.&#8221;</p><p>You wouldn't normally have expected this to work in the old days of conventional search, but with all the talk about agentic search and AI-powered research assistants, users may now expect it to.</p><p>While some agentic systems can indeed do it, this requires running multiple operations in sequence: retrieve the article, extract its reference list, search for semantically related papers, compare the sets, identify gaps. Still, it's a reasonably simple research workflow.</p><p>But AI search tools vary dramatically in whether they can execute it. <a href="https://aarontay.substack.com/p/how-agentic-are-academic-deep-research">In my testing, &#8220;deep research&#8221; or agentic search tools like Elicit, Undermind, Scite Assistant, and Consensus failed at this task, despite many having citation searching or parsing capability&#8212;probably due to predetermined workflows</a>.</p><p>Agentic systems with genuine compositional capability can accomplish this: fetch the article, parse references, run searches, synthesise results&#8212;potentially working with a sequence of steps that wasn&#8217;t predetermined by the designers.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!rdcp!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F50216806-ad06-4152-b637-85af53f8e5ad_1024x559.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" 
srcset="https://substackcdn.com/image/fetch/$s_!rdcp!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F50216806-ad06-4152-b637-85af53f8e5ad_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!rdcp!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F50216806-ad06-4152-b637-85af53f8e5ad_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!rdcp!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F50216806-ad06-4152-b637-85af53f8e5ad_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!rdcp!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F50216806-ad06-4152-b637-85af53f8e5ad_1024x559.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!rdcp!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F50216806-ad06-4152-b637-85af53f8e5ad_1024x559.jpeg" width="1024" height="559" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/50216806-ad06-4152-b637-85af53f8e5ad_1024x559.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!rdcp!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F50216806-ad06-4152-b637-85af53f8e5ad_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!rdcp!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F50216806-ad06-4152-b637-85af53f8e5ad_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!rdcp!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F50216806-ad06-4152-b637-85af53f8e5ad_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!rdcp!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F50216806-ad06-4152-b637-85af53f8e5ad_1024x559.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" 
stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Systems with fixed workflows like <a href="https://asta.allen.ai/">AI2&#8217;s Asta (formerly AI2 Paper Finder),</a> Undermind.ai, Elicit, and Consensus implement predetermined pipelines: &#8220;literature search,&#8221; &#8220;citation chasing,&#8221; &#8220;evaluation of results&#8221; or &#8220;summarisation&#8221; in a fairly fixed sequence. The LLM decides which pre-built flow to invoke, but it cannot compose novel sequences. The operations exist in isolation, not as combinable primitives.</p><p>The user staring at the search box has no way to know which category their tool falls into. They may assume the limitation is their own&#8212;that they haven&#8217;t found the right phrasing&#8212;when they&#8217;re hitting an architectural ceiling. This is perhaps the cruellest form of capability ambiguity: users engage in elaborate prompt engineering to unlock capabilities that don&#8217;t exist. </p><p>(For more details, see <em><a href="https://aarontay.substack.com/p/how-agentic-are-academic-deep-research">Deep Research, Shallow Agency: What Academic Deep Research Can and Can&#8217;t Do</a></em><a href="https://aarontay.substack.com/p/how-agentic-are-academic-deep-research">.</a>)</p><p>  </p><h3>Why does a search fail?</h3><p>Failures in most AI search tools are usually silent, and different kinds of failure are indistinguishable from the user&#8217;s perspective. A search returning irrelevant results could be failing for any of several reasons, and it is not easy for a user to tell:</p><ul><li><p>Whether they used the wrong input mode (e.g. 
using a natural language query with a lexical search system)</p></li><li><p>Whether they phrased their query poorly within the correct mode (e.g. using the wrong keywords in a lexical search system)</p></li><li><p>Whether their filters were recognised and applied (e.g. asking in natural language to &#8220;filter to review articles&#8221; but this isn&#8217;t a field the system can filter on or it can do so but the natural language parser isn&#8217;t set up to do so).</p></li><li><p>Whether the system lacks the workflow operations (e.g. do forward citations of paper X) they need to do the task.</p></li><li><p>Whether those operations exist (do forward citations of paper X) in the system but can&#8217;t be composed into their desired workflow</p></li></ul><p><em>More dangerously, parts of the search could silently fail or be ignored.</em> This is certainly true for embedding systems that simply find the closest matches, LLMs that rewrite your input query (e.g., Primo Research Assistant), and Deep Research tools (e.g., Undermind.ai). You will always get 'something,' even when your query is not correctly interpreted!</p><h4>Case Study: The Danger of the &#8220;Silent Rewrite&#8221;</h4><p>The most dangerous failure is the one users cannot see. Consider this query I ran in <strong>Primo Research Assistant</strong>:</p><p><code>Find articles on climate change in 2023 , review articles only and do forward citation search of top 10 papers</code></p><p>It happily ran with no trace of an error despite not being able to filter by review articles, not to mention it definitely couldn&#8217;t do things like forward citation searching. 
Below shows the result.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!MhMD!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff2b32993-c99f-48ac-9f8b-5e92d2b90399_1330x848.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!MhMD!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff2b32993-c99f-48ac-9f8b-5e92d2b90399_1330x848.png 424w, https://substackcdn.com/image/fetch/$s_!MhMD!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff2b32993-c99f-48ac-9f8b-5e92d2b90399_1330x848.png 848w, https://substackcdn.com/image/fetch/$s_!MhMD!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff2b32993-c99f-48ac-9f8b-5e92d2b90399_1330x848.png 1272w, https://substackcdn.com/image/fetch/$s_!MhMD!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff2b32993-c99f-48ac-9f8b-5e92d2b90399_1330x848.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!MhMD!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff2b32993-c99f-48ac-9f8b-5e92d2b90399_1330x848.png" width="1330" height="848" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f2b32993-c99f-48ac-9f8b-5e92d2b90399_1330x848.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:848,&quot;width&quot;:1330,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:164317,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/181104601?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff2b32993-c99f-48ac-9f8b-5e92d2b90399_1330x848.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!MhMD!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff2b32993-c99f-48ac-9f8b-5e92d2b90399_1330x848.png 424w, https://substackcdn.com/image/fetch/$s_!MhMD!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff2b32993-c99f-48ac-9f8b-5e92d2b90399_1330x848.png 848w, https://substackcdn.com/image/fetch/$s_!MhMD!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff2b32993-c99f-48ac-9f8b-5e92d2b90399_1330x848.png 1272w, https://substackcdn.com/image/fetch/$s_!MhMD!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff2b32993-c99f-48ac-9f8b-5e92d2b90399_1330x848.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The <a href="https://knowledge.exlibrisgroup.com/Primo/Product_Documentation/020Primo_VE/Primo_VE_(English)/015_Getting_Started_with_Primo_Research_Assistant#:~:text=internal%20preventative%20measure.-,How%20It%20Works,the%20query%20language%2C%20and%20the%20other%20variations%20will%20be%20in%20English.,-Results%20Retrieval%20%E2%80%93%20The">LLM in Primo Research Assistant rewrote the input to a boolean search without the restrictions and ran it</a>. Below is the rewritten query. 
Notice what it dropped.</p><p><code>(climate change impacts) OR (global warming) OR (climate change adaptation) OR ((climate change) OR (global warming)) OR ((climate change) AND (environmental policy)) OR (&quot;climate change&quot;) OR ((global warming) OR (climate variability)) OR ((climate change) AND (mitigation)) OR ((greenhouse gases) AND (climate impact)) OR (environmental change) OR (climate change)</code></p><p>There is also another subtle failure. Primo Research Assistant can correctly parse query inputs like </p><p><code>Papers on X from 2023 to 2024</code>, </p><p>but when the query input is</p><p><code>Papers on X in 2023 </code></p><p>it was interpreted in Primo Research Assistant as 2023 to 2025, as shown in the applied filter at the bottom of the screen capture!</p><p>You might then think&#8212;maybe if you just prompt in the right way, you could get it to filter to only 2023 (maybe by adding &#8220;Only&#8221;)<a class="footnote-anchor" data-component-name="FootnoteAnchorToDOM" id="footnote-anchor-10" href="#footnote-10" target="_self">10</a>. </p><p>Here lies another problem: even if the user notices that the query input wasn&#8217;t followed, it might lead to &#8220;prompt thrashing&#8221;&#8212;users reformulating the same request in increasingly elaborate ways, hoping to unlock functionality that may not exist or may be failing at something query reformulation doesn&#8217;t (or can&#8217;t ever) address. They blame their query formulation when the actual limitations could, say, be architectural.</p><p>Meanwhile, systems that do support complex operations provide no signal that such capabilities are available. A user who never thinks to ask &#8220;compare the citation networks of these two papers&#8221; will never discover that the system can do it.</p><h3>Designing a Way Out</h3><p>Turnbull argues the solution lies in reconceiving the role of LLMs in search. Their power isn't semantic similarity&#8212;it's query understanding. 
An LLM can take free text ("suede, geometric couch") and produce a structured query with typed fields: style (geometric), material (suede), classification (Living Room / Seating / Sofas). Each field maps to an appropriate retrieval technique&#8212;visual embeddings for style, taxonomic matching for materials, hierarchical classification for categories.</p><p>This decomposition serves multiple purposes. It enables precision where precision is possible. It makes the system&#8217;s interpretation visible and correctable. And crucially, it provides affordances: users can see how their query was parsed and understand what refinements are available. The continuous similarity score of vector search offers no such guidance.</p><p>But most AI search interfaces don&#8217;t expose this architecture. They present a blank box and hope the system will figure out which parts of the input are filter requests, which are content queries, and which are workflow instructions and fail silently.</p><h3>Concrete Solutions</h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!cCIB!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F204209f1-5798-45cb-9971-1e788e9d1713_1024x559.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!cCIB!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F204209f1-5798-45cb-9971-1e788e9d1713_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!cCIB!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F204209f1-5798-45cb-9971-1e788e9d1713_1024x559.jpeg 848w, 
https://substackcdn.com/image/fetch/$s_!cCIB!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F204209f1-5798-45cb-9971-1e788e9d1713_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!cCIB!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F204209f1-5798-45cb-9971-1e788e9d1713_1024x559.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!cCIB!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F204209f1-5798-45cb-9971-1e788e9d1713_1024x559.jpeg" width="1024" height="559" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/204209f1-5798-45cb-9971-1e788e9d1713_1024x559.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:153465,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/181104601?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F204209f1-5798-45cb-9971-1e788e9d1713_1024x559.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!cCIB!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F204209f1-5798-45cb-9971-1e788e9d1713_1024x559.jpeg 424w, 
https://substackcdn.com/image/fetch/$s_!cCIB!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F204209f1-5798-45cb-9971-1e788e9d1713_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!cCIB!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F204209f1-5798-45cb-9971-1e788e9d1713_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!cCIB!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F204209f1-5798-45cb-9971-1e788e9d1713_1024x559.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" 
y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Solutions exist and some are already in use in existing products. I will list some of them from most to least frequently seen.</p><p><strong>Sample prompts that demonstrate expectations. </strong>It is common practice today to list sample queries below the search box. But example queries should be chosen with care to address both input mode and capability. Are examples terse keywords or elaborate instructions? Do they demonstrate filter syntax, complex operations, or both? Prompts like &#8220;Find highly cited papers on CRISPR ethics from 2020-2024&#8221; reveal that dates and citation thresholds are recognised; &#8220;Compare the methodology of Smith 2020 and Jones 2021&#8221; reveals that document comparison is available.</p><p><strong>Hybrid UI: the return of filters.</strong> There&#8217;s no reason we can&#8217;t add pull-down menus and buttons to signal available affordances. But consistency matters&#8212;if the interface shows a dropdown for document type, users should be able to request the same filter in natural language.</p><p><strong>Type-ahead that reveals constraints. </strong>As users type &#8220;find papers from...&#8221; the system could surface suggestions: &#8220;...from 2020 onwards,&#8221; &#8220;...from Nature,&#8221; &#8220;...from Harvard University.&#8221; This signals which constraint types are recognised while guiding users toward phrasings the system handles well.</p><p><strong>Explicit constraint confirmation. </strong>
Before executing a search, the system could display parsed constraints for confirmation: &#8220;Date: 2020-2024 | Type: peer-reviewed | Sort: citation count | Topic: CRISPR ethics.&#8221; Users see exactly what was recognised, can correct misinterpretations, and learn the system&#8217;s vocabulary through exposure.</p><p><strong>LLM query intent detection to block unsupported inputs. </strong>Pretty much what it says on the tin. The LLM tries to interpret the intent of each query; if it detects that a query is asking for something the tool isn&#8217;t designed to do, it stops. </p><p><strong>Expose the tool layer. </strong>For systems built on protocols like MCP, surface available operations directly: &#8220;Search database X,&#8221; &#8220;Retrieve (forward) citations from Paper Y,&#8221; &#8220;Compare documents,&#8221; &#8220;Extract methodology sections.&#8221; When users see that citation network analysis isn&#8217;t among the available tools, they stop blaming their phrasing and adjust expectations&#8212;or choose a different system. Systems with fixed workflows should make clear what exactly is happening behind the scenes to help head off misunderstandings.</p><p><strong>Template libraries for common workflows. </strong>Offer structured starting points for workflows: &#8220;Find gap in citations,&#8221; &#8220;Compare methodology across papers,&#8221; &#8220;Trace influence of seminal work.&#8221; Each template pre-configures and exposes the right combination of tools while remaining editable for workflow transparency. See, for example, the <a href="https://scispace.com/agents">SciSpace Agent Gallery</a>.</p><h3>Conclusion</h3><p>These solutions address symptoms, but the underlying tension may be irresolvable. 
The promise of natural language search is liberation from formal query languages; the reality is that formal languages encoded precise information about both input expectations and system capabilities that natural language cannot easily replace.</p><p>We&#8217;re in a transitional period where AI search tools vary enormously across many dimensions&#8212;different retrieval abstractions, different filter recognition capabilities, different workflow architectures. Yet they present nearly identical blank text boxes that reveal nothing.</p><p>This results in a massive <strong>&#8220;Cost of Discovery.&#8221;</strong> In the past, if you learned how to use Scopus, you largely knew how to use Web of Science. Now, every AI wrapper has a unique, hidden architecture with varying capabilities.</p><p><em>This places an unreasonable burden on users to discover through experimentation what each system expects and what each system can do. </em>The ambiguities compound: users cannot easily test systematically because there is so much uncertainty across the different subsystems of the search. </p><p>For librarians and information professionals, this creates both challenge and opportunity. The challenge is obvious: how do we teach search skills when the skills required vary by platform in ways that aren&#8217;t visible? Traditional database instruction could focus on Boolean logic and controlled vocabularies. AI search instruction must address input mode, retrieval method, filter recognition, and workflow composition&#8212;none of which are documented completely and consistently.</p><p>The opportunity is that this confusion creates demand for exactly the kind of critical evaluation that information professionals excel at. <a href="https://aarontay.substack.com/p/what-do-we-actually-mean-by-ai-powered">Mapping the capability landscape of AI search tools&#8212;not just feature lists but actual functional boundaries at each level</a>&#8212;is work that needs doing. 
Understanding when embedding retrieval is in play and hence when natural language input is appropriate, when filter triggers are recognised, when workflows can be composed: this technical evaluation distinguishes informed tool selection from marketing-driven adoption or fear-driven resistance.</p><p>Until AI search interfaces evolve better affordances, we may need to return to an old practice: demanding that documentation exist for input expectations, filter vocabularies, retrieval mechanisms, and workflow capabilities&#8212;and that it be surfaced at the point of need rather than buried in help pages no one visits.</p><p><strong>The blank search box feels like an invitation to ask anything. It&#8217;s actually a test at multiple levels</strong>&#8212;of whether you know how to ask, whether you know what you can ask for, and whether you can diagnose what actually doesn&#8217;t work when you don&#8217;t get what you need. </p><p> </p><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-1" href="#footnote-anchor-1" class="footnote-number" contenteditable="false" target="_self">1</a><div class="footnote-content"><p>Most academic databases like Scopus enforced hard Boolean logic, followed by ranking of the matched set with <a href="https://emschwartz.me/understanding-the-bm25-full-text-search-algorithm/">TF-IDF/BM25</a>. A rare few, typically academic web search engines like Google Scholar, were still lexical search but did not enforce strict Boolean matching, typically employing just ranked retrieval with BM25 (without Boolean).</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-2" href="#footnote-anchor-2" class="footnote-number" contenteditable="false" target="_self">2</a><div class="footnote-content"><p>I&#8217;ve used the &#8220;Caveman&#8221; analogy here for keyword search for a bit of fun. It isn&#8217;t meant to suggest the technique is outdated&#8212;both keyword and semantic search have their points. 
A &#8220;Programmer/Robot&#8221; comparison would be more suitable if nested Boolean were used. But we know that in reality most users default to simple keyword searches, dropping the stop words and letting the magic of <a href="https://webofscience.zendesk.com/hc/en-us/articles/20016122409105-Search-Operators#:~:text=Implicit%20%22AND%22,the%20same%20number%20of%20results.">implicit AND</a> do the work.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-3" href="#footnote-anchor-3" class="footnote-number" contenteditable="false" target="_self">3</a><div class="footnote-content"><p>Ibid.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-4" href="#footnote-anchor-4" class="footnote-number" contenteditable="false" target="_self">4</a><div class="footnote-content"><p>So what should you input? If you know roughly what is going on (and I will talk about how to roughly figure out what is going on under the hood in a future post), here is what you should do.</p><p><a href="https://aarontay.substack.com/p/why-entering-your-query-in-natural">If your query goes directly to an embedding model for retrieval, natural language works well (better than keyword)&#8212;these models are trained on natural language and capture semantic similarity</a>. That said, many modern systems use hybrid retrieval&#8212;combining embeddings with keyword-based methods like BM25&#8212;so well-chosen terms still matter, particularly for named entities or specialist vocabulary.</p><p>As for prompt engineering, <a href="https://aarontay.substack.com/p/prompt-engineering-with-retrieval">I&#8217;ve been sceptical about elaborate tactics&#8212;particularly those lifted wholesale from papers based on GPT-3.5/4 without independent testing.</a> But that scepticism was grounded in my 2023/2024 understanding. 
Since then, LLMs have improved considerably through better tool use training and agentic orchestration, and may respond better to complicated prompts, so the picture is less clear.</p><p>Still, if an LLM sits between you and the retrieval layer&#8212;as in more advanced AI search tools&#8212;it will likely rewrite or expand your query before searching. I think elaborate phrasing is probably wasted effort; the system normalises your input anyway. What matters is clearly expressing your information need.</p><p>In agentic systems with iterative retrieval, the LLM&#8217;s system prompt and workflow architecture dominate. Your exact wording matters less; specifying constraints (date ranges, study types, specific populations) in plain language may help if the system parses them (see later), but this is system-dependent.</p><p><strong>Practical advice:</strong> Describe what you want in clear natural language. Include specific terms the system must match. Don&#8217;t bother with elaborate prompt engineering tactics&#8212;either the embedding model won&#8217;t understand them, or the LLM will rewrite your input regardless. </p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-5" href="#footnote-anchor-5" class="footnote-number" contenteditable="false" target="_self">5</a><div class="footnote-content"><p>*<a href="https://elicit.com/blog/semantic-search/">Elicit has since moved to SPLADE,</a> a learnt sparse retrieval method. This is a hybrid semantic+lexical search method - which allows the use of <a href="https://www.geeksforgeeks.org/dbms/inverted-index/">inverted index</a> (used also by lexical search) that makes filtering relatively computationally cheap.  
(see <a href="https://support.elicit.com/en/articles/2300417">list of advanced filters available in Elicit</a>)</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-6" href="#footnote-anchor-6" class="footnote-number" contenteditable="false" target="_self">6</a><div class="footnote-content"><p><a href="https://aarontay.substack.com/i/169318495/why-hit-counts-by-vector-similarity-are-hard">Vector similarity of dense embeddings usually involves finding the top K most similar embeddings to the query embedding</a>. With a large enough collection, it may be too slow to do a brute-force search, so systems employ approximate nearest neighbour (ANN) indices like <a href="https://open.substack.com/pub/sarthakai/p/a-vectordb-doesnt-actually-work-the">HNSW (</a><strong><a href="https://open.substack.com/pub/sarthakai/p/a-vectordb-doesnt-actually-work-the">Hierarchical Navigable Small World</a></strong><a href="https://open.substack.com/pub/sarthakai/p/a-vectordb-doesnt-actually-work-the">)</a>. But these indices are optimised only for the distribution of the full dataset. For example, HNSW builds a hierarchical graph where nodes (vectors) are connected to their nearest neighbours across multiple layers, with navigation starting at sparse upper layers and refining at denser lower layers. During search, the algorithm greedily traverses edges towards the query vector. However, when filters exclude many vectors, the graph connectivity breaks&#8212;the greedy path may dead-end at filtered-out nodes, or the remaining filtered subset forms disconnected islands in the graph structure. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!rvZC!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60aeb784-d169-4777-8d81-9123788877a9_1024x559.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!rvZC!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60aeb784-d169-4777-8d81-9123788877a9_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!rvZC!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60aeb784-d169-4777-8d81-9123788877a9_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!rvZC!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60aeb784-d169-4777-8d81-9123788877a9_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!rvZC!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60aeb784-d169-4777-8d81-9123788877a9_1024x559.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!rvZC!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60aeb784-d169-4777-8d81-9123788877a9_1024x559.jpeg" width="1024" height="559" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/60aeb784-d169-4777-8d81-9123788877a9_1024x559.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:118910,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/181104601?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60aeb784-d169-4777-8d81-9123788877a9_1024x559.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!rvZC!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60aeb784-d169-4777-8d81-9123788877a9_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!rvZC!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60aeb784-d169-4777-8d81-9123788877a9_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!rvZC!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60aeb784-d169-4777-8d81-9123788877a9_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!rvZC!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60aeb784-d169-4777-8d81-9123788877a9_1024x559.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>The index doesn't "know" about filter constraints, so traversal routes optimised for the full dataset fail to efficiently find nearest neighbours within the filtered subset. Post-filtering (retrieve K, then filter) risks returning fewer than K results. Pre-filtering (filter, then search) means either rebuilding indices per filter (impractical) or using the mismatched global index (suboptimal recall). 
<a href="https://weaviate.io/blog/speed-up-filtered-vector-search">Recent work such as ACORN addresses this by selectively expanding search to second-hop neighbours (neighbours of neighbours) when immediate neighbours are filtered out, maintaining connectivity at the cost of additional distance computations.</a></p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-7" href="#footnote-anchor-7" class="footnote-number" contenteditable="false" target="_self">7</a><div class="footnote-content"><p>Retrieval systems use several approaches to recognise filters in natural language. Rule-based pattern matching is cheap but brittle&#8212;it fails on paraphrases. Named entity recognition can tag journals and authors but requires domain-specific training. Modern systems increasingly use LLM-based query decomposition, parsing natural language into structured filters. This is more flexible but introduces new problems: LLMs may hallucinate filter capabilities (easy to verify though), parse similar queries inconsistently, or silently treat filter requests as topical content.</p><p>Disclosure: Images are generated using Nano Banana Pro.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-8" href="#footnote-anchor-8" class="footnote-number" contenteditable="false" target="_self">8</a><div class="footnote-content"><p>Primo NDE (New Design Experience) is a new interface refresh of Primo. It is not the same as Primo Research Assistant, which is a separate module that you can access via Primo. 
Despite that, both Primo Research Assistant and the natural language search feature in Primo NDE use LLMs to translate query input into Boolean.</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-9" href="#footnote-anchor-9" class="footnote-number" contenteditable="false" target="_self">9</a><div class="footnote-content"><p>As noted already, this isn&#8217;t an absurd ask, since Web of Science Research Assistant by the same company does support this query!</p></div></div><div class="footnote" data-component-name="FootnoteToDOM"><a id="footnote-10" href="#footnote-anchor-10" class="footnote-number" contenteditable="false" target="_self">10</a><div class="footnote-content"><p>So far as I can tell, there isn&#8217;t a way.</p></div></div>]]></content:encoded></item><item><title><![CDATA[What Do We Actually Mean by "AI-Powered Search"? ]]></title><description><![CDATA[When we say "AI-powered search engine," we're conflating at least four different things&#8212;and your concerns about one may not apply to another.]]></description><link>https://aarontay.substack.com/p/what-do-we-actually-mean-by-ai-powered</link><guid isPermaLink="false">https://aarontay.substack.com/p/what-do-we-actually-mean-by-ai-powered</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Sat, 27 Dec 2025 21:24:18 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!F504!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!F504!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg" 
data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!F504!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 424w, https://substackcdn.com/image/fetch/$s_!F504!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 848w, https://substackcdn.com/image/fetch/$s_!F504!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!F504!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!F504!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg" width="1024" height="541" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/bc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:541,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!F504!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 424w, https://substackcdn.com/image/fetch/$s_!F504!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 848w, https://substackcdn.com/image/fetch/$s_!F504!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!F504!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" 
stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me Coffee (via ko-fi)&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me Coffee (via ko-fi)</span></a></p><p>I've been watching the reactions to <a href="https://aarontay.substack.com/p/scholar-labs-early-review-google">Google Scholar Labs</a> with considerable interest. The responses range from enthusiastic embrace to outright rejection. One response particularly intrigued me&#8212;someone mentioned they were initially reluctant to try because they'd heard it was "AI-powered" but became more interested when they read my review and realized what that actually meant (they expected it to generate answers to questions when all it did was do better ranking).</p><p>Another interesting puzzle was when I noticed some library guides listing Semantic Scholar as &#8220;Semantic/Neural Search&#8221; when a <a href="https://arxiv.org/abs/2301.10140">technical look at their main retrieval method reveals the main search is still largely lexical search</a>. 
</p><p>While one can understand and agree with the listing of Semantic Scholar as &#8220;AI powered&#8221; due to clear AI features like TLDR, doing the same for <a href="http://lens.org">Lens.org</a> and <a href="http://openalex.org">OpenAlex</a> is a much harder sell, because they not only do just keyword search but also lack the obvious AI features of Semantic Scholar.</p><p>It&#8217;s made me realise we might all be talking past each other because we haven&#8217;t actually defined what we mean.</p><p>&#8220;AI-powered search engine&#8221; is a handy catch-all term used by vendors, but it actually hides a diverse set of systems and functionality. In this post, I&#8217;ll dissect the different ways academic search can be &#8220;AI-powered&#8221; so you can decide which types actually cross the line for you.</p><p>I am going to argue that we often mean at least 4 different things when we call something &#8220;AI-powered search&#8221;:</p><ul><li><p><strong>Level 1: Post-Retrieval AI Features</strong></p></li><li><p><strong>Level 2: Going beyond Lexical Search with Semantic Search</strong></p></li><li><p><strong>Level 3: LLMs for Retrieval and/or Relevance Ranking</strong></p></li><li><p><strong>Level 4: Synthesis and Generation Across Papers</strong></p></li><li><p><strong>Level 0??: Use of AI to extract, cluster, or organise metadata used for retrieval</strong></p></li></ul><p>Levels here may not be the right framing, as the four different categories are largely orthogonal (except maybe Level 3 is a subset of Level 2), but they map to the most common academic search products (e.g. 
Level 4 is usually Deep Research)  and higher levels generally reflect higher risk and greater amount of pushback from librarians.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><h2>The Spectrum of AI in Search</h2><p><strong>Level 1: Post-Retrieval AI Features</strong></p><p>Does &#8220;AI-powered search engine&#8221; mean &#8220;AI&#8221; that impacts the search process only? Not necessarily.</p><p>There&#8217;s a whole category of AI features that don&#8217;t affect the search results you get at all. Things like optional summarisation of individual items (e.g., <a href="https://about.ebsco.com/artificial-intelligence/products/ai-insights">AI Insights on Ebscohost databases</a>), translation tools, or text-to-speech features.</p><p>These are post-retrieval conveniences. You search, you get your results list (however that list was generated), and then you have the option to use AI to help you process what you found. The search itself? Unchanged. </p><p>In theory, if you don&#8217;t like these features, you can ignore them. </p><p><strong>Level 2:  Going beyond Lexical Search with Semantic Search</strong></p><p>Now let&#8217;s get into actual search mechanisms. 
Suppose a search engine doesn&#8217;t do traditional lexical/keyword matching but instead uses &#8220;semantic search&#8221;&#8212;where <a href="https://aarontay.substack.com/p/why-embedding-vector-search-is-probably">queries are run through an encoder model to convert into embeddings and matched against the embeddings of indexed documents to get a relevance score</a>. </p><blockquote><p>&#8220;Semantic search&#8221; can refer to (1) meaning-aware retrieval (dense embeddings / neural retrievers), (2) sparse neural retrieval (not dense embeddings, but still &#8220;neural&#8221; e.g. SPLADE) (3) query expansion / thesauri / ontologies (not embeddings). (1) is by far the most popular today and discussed here.</p></blockquote><p> </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!hyXk!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4cfbea7-8ab1-42ab-b268-80bc1e593dfe_601x477" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!hyXk!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4cfbea7-8ab1-42ab-b268-80bc1e593dfe_601x477 424w, https://substackcdn.com/image/fetch/$s_!hyXk!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4cfbea7-8ab1-42ab-b268-80bc1e593dfe_601x477 848w, https://substackcdn.com/image/fetch/$s_!hyXk!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4cfbea7-8ab1-42ab-b268-80bc1e593dfe_601x477 1272w, 
https://substackcdn.com/image/fetch/$s_!hyXk!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4cfbea7-8ab1-42ab-b268-80bc1e593dfe_601x477 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!hyXk!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4cfbea7-8ab1-42ab-b268-80bc1e593dfe_601x477" width="601" height="477" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f4cfbea7-8ab1-42ab-b268-80bc1e593dfe_601x477&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:477,&quot;width&quot;:601,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;A diagram of embedding search in practice\n\nAI-generated content may be incorrect.&quot;,&quot;title&quot;:&quot;A diagram of embedding search in practice\n\nAI-generated content may be incorrect.&quot;,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="A diagram of embedding search in practice

AI-generated content may be incorrect." title="A diagram of embedding search in practice

AI-generated content may be incorrect." srcset="https://substackcdn.com/image/fetch/$s_!hyXk!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4cfbea7-8ab1-42ab-b268-80bc1e593dfe_601x477 424w, https://substackcdn.com/image/fetch/$s_!hyXk!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4cfbea7-8ab1-42ab-b268-80bc1e593dfe_601x477 848w, https://substackcdn.com/image/fetch/$s_!hyXk!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4cfbea7-8ab1-42ab-b268-80bc1e593dfe_601x477 1272w, https://substackcdn.com/image/fetch/$s_!hyXk!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4cfbea7-8ab1-42ab-b268-80bc1e593dfe_601x477 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" 
stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><em><a href="https://aarontay.substack.com/p/why-embedding-vector-search-is-probably">Semantic Search using dense embeddings (also known as vector/embedding/neural search/retrieval)</a></em></p><p>Is that &#8220;AI&#8221;?</p><blockquote><p>A quick terminology note: when I say &#8220;lexical&#8221; or &#8220;keyword&#8221; search, I&#8217;m referring to methods that match based on the actual words in your query and the documents. This includes both Boolean search (exact matching with AND/OR/NOT operators) and <a href="https://emschwartz.me/understanding-the-bm25-full-text-search-algorithm/">probabilistic methods like BM25 (which scores documents based on term frequency, document length, and how rare each term is across the corpus)</a>. These are related but distinct&#8212;Boolean gives you a set of matching documents, while BM25 gives you a ranked list. Most traditional academic databases like Scopus use Boolean first to retrieve a set of documents and then do relevance ranking with <a href="https://kmwllc.com/index.php/2020/03/20/understanding-tf-idf-and-bm-25/">BM25 (or the related TF-IDF)</a>. Neither attempts to understand semantic meaning as they just match strings. That said, it is common to stack a reranker on top of that which is trained using supervised learning (learning to rank model) on labelled click data. We will discuss this in the section on Semantic Scholar.</p></blockquote><p>Let&#8217;s take for granted that traditional information retrieval methods like Boolean and BM25 aren&#8217;t &#8220;AI&#8221; otherwise by default every search engine is AI!  
</p><p>So what we&#8217;re saying is that anything that goes beyond traditional keyword matching&#8212;such as semantic search via embedding search/match&#8212;is considered &#8220;AI-powered search.&#8221; An example is <a href="https://support.jstor.org/hc/en-us/articles/34461819575831-Searching-Keyword-versus-Semantic-Results">JSTOR beta&#8217;s semantic results function</a>.  </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!GmZT!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9b6e119d-b6b1-4be8-b763-0ad63aa59850_921x750.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!GmZT!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9b6e119d-b6b1-4be8-b763-0ad63aa59850_921x750.png 424w, https://substackcdn.com/image/fetch/$s_!GmZT!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9b6e119d-b6b1-4be8-b763-0ad63aa59850_921x750.png 848w, https://substackcdn.com/image/fetch/$s_!GmZT!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9b6e119d-b6b1-4be8-b763-0ad63aa59850_921x750.png 1272w, https://substackcdn.com/image/fetch/$s_!GmZT!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9b6e119d-b6b1-4be8-b763-0ad63aa59850_921x750.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!GmZT!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9b6e119d-b6b1-4be8-b763-0ad63aa59850_921x750.png" width="921" height="750" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/9b6e119d-b6b1-4be8-b763-0ad63aa59850_921x750.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:750,&quot;width&quot;:921,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:73694,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180945021?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9b6e119d-b6b1-4be8-b763-0ad63aa59850_921x750.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!GmZT!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9b6e119d-b6b1-4be8-b763-0ad63aa59850_921x750.png 424w, https://substackcdn.com/image/fetch/$s_!GmZT!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9b6e119d-b6b1-4be8-b763-0ad63aa59850_921x750.png 848w, https://substackcdn.com/image/fetch/$s_!GmZT!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9b6e119d-b6b1-4be8-b763-0ad63aa59850_921x750.png 1272w, https://substackcdn.com/image/fetch/$s_!GmZT!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9b6e119d-b6b1-4be8-b763-0ad63aa59850_921x750.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Note that all that changes is the relevancy algorithm. You still get a list of results (though <a href="https://aarontay.substack.com/p/the-case-of-the-vanishing-hit-count">embedding-based search usually only retrieves top K results rather than all hits like a Boolean search</a>). There is no generated answer.</p><blockquote><p>Embedding search is fantastic at understanding broad conceptual similarity, but it can be &#8216;fuzzy&#8217;&#8212;sometimes retrieving papers that feel related but miss the specific keywords or strict criteria you need. That is why it is common to do hybrid search combining  both methods</p></blockquote><p>A decade or two ago, more librarians would have heavily objected to non-keyword search methods because the results would be less explainable. 
(I suspect <a href="https://musingsaboutlibrarianship.blogspot.com/2012/05/how-is-google-different-from.html">two decades of using Google&#8217;s soft or fuzzy Boolean search and getting relevant results without all matching terms has weakened the resistance!</a>) These days I see more librarians (except systematic review specialists) accepting such retrieval methods, particularly if they improve recall or precision&#8212;even if it <a href="https://aarontay.substack.com/p/the-reproducibility-and">means losing both interpretability and often reproducibility</a>.</p><p>They&#8217;re often even more accepting when told the embeddings aren&#8217;t strictly &#8220;Large Language Models,&#8221; which now seem to be the bogeyman many people have in mind. But how different are they really?  </p><blockquote><p>Language models compute the conditional probability of a token given a context window, using these probabilities to sample and generate sequences. Embedding models, however, focus on representation learning, mapping input sequences to fixed-size vectors without an autoregressive generation component.</p></blockquote><p>That said, these days the embedding models we use (e.g., BERT, SciBERT, SPECTER) are <em>transformer-based encoder models</em>, which are very close cousins of <em>the GPT-style transformer-based decoder models. 
(I will ignore encoder-decoder models)</em></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!KYpn!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F522a5959-0742-482c-bf13-03a47d3c5f50_1536x1024.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!KYpn!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F522a5959-0742-482c-bf13-03a47d3c5f50_1536x1024.png 424w, https://substackcdn.com/image/fetch/$s_!KYpn!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F522a5959-0742-482c-bf13-03a47d3c5f50_1536x1024.png 848w, https://substackcdn.com/image/fetch/$s_!KYpn!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F522a5959-0742-482c-bf13-03a47d3c5f50_1536x1024.png 1272w, https://substackcdn.com/image/fetch/$s_!KYpn!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F522a5959-0742-482c-bf13-03a47d3c5f50_1536x1024.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!KYpn!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F522a5959-0742-482c-bf13-03a47d3c5f50_1536x1024.png" width="1456" height="971" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/522a5959-0742-482c-bf13-03a47d3c5f50_1536x1024.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:971,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1840597,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180945021?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F522a5959-0742-482c-bf13-03a47d3c5f50_1536x1024.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!KYpn!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F522a5959-0742-482c-bf13-03a47d3c5f50_1536x1024.png 424w, https://substackcdn.com/image/fetch/$s_!KYpn!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F522a5959-0742-482c-bf13-03a47d3c5f50_1536x1024.png 848w, https://substackcdn.com/image/fetch/$s_!KYpn!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F522a5959-0742-482c-bf13-03a47d3c5f50_1536x1024.png 1272w, https://substackcdn.com/image/fetch/$s_!KYpn!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F522a5959-0742-482c-bf13-03a47d3c5f50_1536x1024.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><strong>How decoder models (LLMs) are trained:</strong> GPT-style models are trained on massive text corpora using &#8220;next token prediction&#8221; (also known as causal language modelling)&#8212;given a sequence of words, predict what comes next. This autoregressive training is what enables them to generate fluent text. The model learns statistical patterns across billions of documents, building an implicit representation of language, facts, and reasoning patterns.</p><p><strong>How encoder models are trained: </strong>Models like BERT, SciBERT, and SPECTER use a different pretraining objective&#8212;&#8220;masked language modelling,&#8221; which is essentially a cloze test. Random words in a sentence are masked out, and the model learns to predict the missing words based on surrounding context. 
This bidirectional training (looking at context on both sides) produces rich representations of meaning, but the model isn&#8217;t designed to generate text&#8212;it outputs embeddings that capture semantic relationships.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!ZFXe!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc126c038-10be-4d9a-baf3-498cd703260f_1024x559.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!ZFXe!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc126c038-10be-4d9a-baf3-498cd703260f_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!ZFXe!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc126c038-10be-4d9a-baf3-498cd703260f_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!ZFXe!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc126c038-10be-4d9a-baf3-498cd703260f_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!ZFXe!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc126c038-10be-4d9a-baf3-498cd703260f_1024x559.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!ZFXe!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc126c038-10be-4d9a-baf3-498cd703260f_1024x559.jpeg" width="1024" height="559" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c126c038-10be-4d9a-baf3-498cd703260f_1024x559.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:144746,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180945021?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc126c038-10be-4d9a-baf3-498cd703260f_1024x559.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!ZFXe!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc126c038-10be-4d9a-baf3-498cd703260f_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!ZFXe!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc126c038-10be-4d9a-baf3-498cd703260f_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!ZFXe!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc126c038-10be-4d9a-baf3-498cd703260f_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!ZFXe!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc126c038-10be-4d9a-baf3-498cd703260f_1024x559.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><blockquote><p>Historically, only encoder models were used as embedding models, and while many modern embedding models (e.g., SBERT, E5, Gecko) are still based on transformer encoder architectures, recent top-performing embedding models&#8212;like OpenAI&#8217;s ada, Google&#8217;s Gemini embeddings, and E5-Mistral&#8212;are derived from large decoder-based transformers. Decoder models are not naturally designed to output embeddings&#8212;they are meant to predict the next token&#8212;but with proper fine-tuning they can effectively generate embeddings, often excelling because of their larger base model size (decoder-derived embedding models tend to have billions of parameters instead of the hundreds of millions typical of encoder models), though with higher energy costs.</p></blockquote><p>The similarities are substantial. 
Both use the transformer architecture. Both are trained on large text corpora through self-supervised learning. Both learn distributed representations of language. The encoder/decoder distinction is primarily about the training objective and what the model outputs, not fundamental differences in how they learn from data.</p><p>This means that if your concern is intellectual property&#8212;where the training data comes from, whether it was used with permission, whether the model has &#8220;ingested&#8221; copyrighted works&#8212;the issues are largely the same for both model types. An encoder model trained on scraped academic papers raises similar provenance questions to a decoder model trained on the same corpus.</p><p><strong>However, there is one meaningful difference:</strong> encoder models do not reproduce text. They convert text into numerical vectors and compare those vectors. A decoder model, by contrast, can regenerate text that closely resembles its training data&#8212;this is the basis of concerns about LLMs reproducing copyrighted passages or memorising private information. Encoder models used for semantic search can only say &#8220;these two texts are semantically similar&#8221;&#8212;they don&#8217;t generate passages, so the plagiarism-style risk is lower.</p><p>So if your concern is specifically about text reproduction and the potential for plagiarism or copyright-infringing outputs, encoder-based semantic search is genuinely lower risk. If your concern is about the ethics of training on data without consent, the distinction offers less comfort.</p><p>There are also practical differences: embedding models tend to be much smaller and less energy-hungry than modern LLMs. 
And because we&#8217;re not generating answers, just doing relevance ranking, we avoid issues like citation faithfulness and <a href="https://bera-journals.onlinelibrary.wiley.com/doi/full/10.1111/bjet.13544?casa_token=iQsXd4R0hbgAAAAA%3AJXFnbkinwf2NpdMzKkIqdLxiiHj8kRmcaguLxZmYihWHflb2eC7x-vBa5m8H8MJWl594MMyvw9-hepKq">cognitive offloading.</a></p><p><strong>Level 3: LLMs for Retrieval and/or Relevance Ranking</strong></p><p>Okay, so maybe you&#8217;re comfortable with embeddings from encoder models and you are happy it doesn&#8217;t generate answers.  </p><p>What if the search engine uses an <a href="https://aarontay.substack.com/p/the-reproducibility-and">LLM to generate a Boolean search strategy and then runs keyword search as normal (e.g., Web of Science Research Assistant)?</a> <a href="https://aarontay.substack.com/p/the-reproducibility-and">Or does hybrid search where it first runs LLM-generated Boolean before reranking using embeddings (e.g., Primo Research Assistant)? Or does both LLM-generated Boolean plus embedding search together and reranks (e.g., Scopus AI)?</a>  </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!atRx!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!atRx!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 424w, https://substackcdn.com/image/fetch/$s_!atRx!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 848w, 
https://substackcdn.com/image/fetch/$s_!atRx!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 1272w, https://substackcdn.com/image/fetch/$s_!atRx!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!atRx!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png" width="1125" height="346" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/bd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:346,&quot;width&quot;:1125,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!atRx!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 424w, https://substackcdn.com/image/fetch/$s_!atRx!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 848w, 
https://substackcdn.com/image/fetch/$s_!atRx!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 1272w, https://substackcdn.com/image/fetch/$s_!atRx!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbd44f5b6-6bef-4149-9b5b-5a003f579a2e_1125x346.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Or what if the system retrieves using keywords (or hybrid methods) then uses GPT-style LLMs to judge relevancy and generate ranking of 
the top K results?</p><p>When using LLMs for relevancy ranking, you can ask the LLM to:</p><ul><li><p>Give a score or categorise documents into relevancy tiers (point-wise comparison)</p></li><li><p>Compare relevancy of two documents (pair-wise comparison)</p></li><li><p>Provide a rank sort of multiple documents (list-wise comparison)</p></li></ul><p>You can also prompt the LLM to give a reason for the score or ranking.</p><p>Regardless of method, we&#8217;re now using those big decoder models&#8212;the ones everyone associates with &#8220;generative AI&#8221;&#8212;but we&#8217;re still just using them to rank search results (typically after an earlier retrieval phase, so that only promising candidates are ranked). No synthesis, no summarisation (except to explain reasoning for relevance), just ordering.</p><blockquote><p>Technical note: You can also use <a href="https://aarontay.substack.com/p/can-semantic-search-be-more">powerful but slow Cross-Encoder or late-interaction models like ColBERT</a> instead of outright GPT-style decoder models to get results almost as good as directly using an LLM. Functionally, with respect to ranking quality, there is little difference, but you do avoid the use of decoder LLMs and hence the IP risks.</p></blockquote><p><a href="https://scholar.googleblog.com/2025/11/scholar-labs-ai-powered-scholar-search.html?m=1">Google Scholar Labs</a> and <a href="https://asta.allen.ai/discover?redirect_from=paper-finder">AI2 Paper Finder (now Asta)</a> use this type of approach&#8212;they use an LLM to do query intent parsing, rank results, and even generate a rationale explaining <em>why</em> each paper was ranked where it was. 
You&#8217;re still ultimately getting a ranked list, but now there&#8217;s AI-generated explanatory text attached to each result.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!c5rp!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0235c115-7a27-4b97-b44f-2605430eea18_1630x773.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!c5rp!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0235c115-7a27-4b97-b44f-2605430eea18_1630x773.png 424w, https://substackcdn.com/image/fetch/$s_!c5rp!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0235c115-7a27-4b97-b44f-2605430eea18_1630x773.png 848w, https://substackcdn.com/image/fetch/$s_!c5rp!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0235c115-7a27-4b97-b44f-2605430eea18_1630x773.png 1272w, https://substackcdn.com/image/fetch/$s_!c5rp!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0235c115-7a27-4b97-b44f-2605430eea18_1630x773.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!c5rp!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0235c115-7a27-4b97-b44f-2605430eea18_1630x773.png" width="1456" height="690" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/0235c115-7a27-4b97-b44f-2605430eea18_1630x773.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:690,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:220779,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180945021?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0235c115-7a27-4b97-b44f-2605430eea18_1630x773.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!c5rp!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0235c115-7a27-4b97-b44f-2605430eea18_1630x773.png 424w, https://substackcdn.com/image/fetch/$s_!c5rp!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0235c115-7a27-4b97-b44f-2605430eea18_1630x773.png 848w, https://substackcdn.com/image/fetch/$s_!c5rp!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0235c115-7a27-4b97-b44f-2605430eea18_1630x773.png 1272w, https://substackcdn.com/image/fetch/$s_!c5rp!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0235c115-7a27-4b97-b44f-2605430eea18_1630x773.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Does this change things, because there is now actual generation of text to explain relevancy or will your objection be that it uses actual LLMs (decoder models) rather than just encoder models?</p><p></p><p><strong>Level 4: Synthesis and Generation Across Papers</strong></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Bqsr!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff09e8a6-9a99-45c9-923e-b795fac30be9_1377x791.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" 
srcset="https://substackcdn.com/image/fetch/$s_!Bqsr!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff09e8a6-9a99-45c9-923e-b795fac30be9_1377x791.png 424w, https://substackcdn.com/image/fetch/$s_!Bqsr!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff09e8a6-9a99-45c9-923e-b795fac30be9_1377x791.png 848w, https://substackcdn.com/image/fetch/$s_!Bqsr!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff09e8a6-9a99-45c9-923e-b795fac30be9_1377x791.png 1272w, https://substackcdn.com/image/fetch/$s_!Bqsr!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff09e8a6-9a99-45c9-923e-b795fac30be9_1377x791.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Bqsr!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff09e8a6-9a99-45c9-923e-b795fac30be9_1377x791.png" width="1377" height="791" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ff09e8a6-9a99-45c9-923e-b795fac30be9_1377x791.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:791,&quot;width&quot;:1377,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:149020,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180945021?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff09e8a6-9a99-45c9-923e-b795fac30be9_1377x791.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" 
class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Bqsr!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff09e8a6-9a99-45c9-923e-b795fac30be9_1377x791.png 424w, https://substackcdn.com/image/fetch/$s_!Bqsr!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff09e8a6-9a99-45c9-923e-b795fac30be9_1377x791.png 848w, https://substackcdn.com/image/fetch/$s_!Bqsr!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff09e8a6-9a99-45c9-923e-b795fac30be9_1377x791.png 1272w, https://substackcdn.com/image/fetch/$s_!Bqsr!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fff09e8a6-9a99-45c9-923e-b795fac30be9_1377x791.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" 
stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Now we&#8217;re getting into what many find most objectionable. This level encompasses two related approaches:</p><p>Quick RAG tools like Elicit, scite assistant, and Primo Research Assistant synthesise information across multiple papers to generate answers with citations, typically using Retrieval Augmented Generation. You ask a question, the system reads through papers, extracts relevant information, and writes you a summary with references. It&#8217;s not just ranking anymore&#8212;it&#8217;s creating new text based on the literature.</p><p><a href="https://aarontay.substack.com/p/why-i-think-academic-deep-research">Deep research tools</a> like <a href="http://undermind.ai">Undermind</a> and <a href="https://aarontay.substack.com/p/a-2025-deep-dive-of-consensus-promises">Consensus&#8217;s deep search mode</a> take this further&#8212;basically RAG on steroids. 
<a href="https://aarontay.substack.com/p/why-i-think-academic-deep-research">These systems don&#8217;t just synthesise a quick answer; they conduct extensive multi-step research processes, following leads, refining searches, and building comprehensive analyses that can run for minutes or even hours.</a>  </p><p>Both approaches share the same fundamental characteristic: the AI is generating novel text that synthesises across sources, not merely ranking or retrieving existing documents.</p><p>Leaving aside the use of LLMs, there are reasons to object to Level 4 tools:</p><ul><li><p><a href="https://www.rollingstone.com/culture/culture-features/ai-chatbot-journal-research-fake-citations-1235485484/">LLMs can produce ghost references</a> (<a href="https://aarontay.substack.com/p/why-ghost-references-still-haunt">though this can be mitigated</a>)</p></li><li><p><a href="https://retractionwatch.com/2025/11/19/ai-unreliable-identifying-retracted-research-papers-study/">Studies have reported LLMs citing retracted papers</a> (<a href="https://onlinelibrary.wiley.com/doi/10.1002/leap.2018">here</a> and <a href="https://preprints.jmir.org/preprint/88766">here</a>)</p></li><li><p>There are doubts whether LLMs can faithfully represent what each article says and properly weight findings when they disagree</p></li></ul><p> Even if these performance issues were mitigated, people also worry about the adverse effects of using and relying on such tools - e.g. <a href="https://www.sciencedirect.com/science/article/pii/S0747563224002541">cognitive offloading from overuse of these functions.</a></p><h2>Different Concerns, Different Red Lines</h2><p>Here&#8217;s the thing&#8212;there&#8217;s no objectively &#8220;right&#8221; answer about what counts as unacceptable AI use. 
But it&#8217;s crucial to be clear with yourself about what you&#8217;re actually concerned about, because different concerns lead to very different red lines.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!KSjx!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F66f621db-7d06-4b0c-9046-44647c178ff9_782x634.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!KSjx!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F66f621db-7d06-4b0c-9046-44647c178ff9_782x634.png 424w, https://substackcdn.com/image/fetch/$s_!KSjx!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F66f621db-7d06-4b0c-9046-44647c178ff9_782x634.png 848w, https://substackcdn.com/image/fetch/$s_!KSjx!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F66f621db-7d06-4b0c-9046-44647c178ff9_782x634.png 1272w, https://substackcdn.com/image/fetch/$s_!KSjx!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F66f621db-7d06-4b0c-9046-44647c178ff9_782x634.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!KSjx!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F66f621db-7d06-4b0c-9046-44647c178ff9_782x634.png" width="782" height="634" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/66f621db-7d06-4b0c-9046-44647c178ff9_782x634.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:634,&quot;width&quot;:782,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:79883,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180945021?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F66f621db-7d06-4b0c-9046-44647c178ff9_782x634.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!KSjx!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F66f621db-7d06-4b0c-9046-44647c178ff9_782x634.png 424w, https://substackcdn.com/image/fetch/$s_!KSjx!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F66f621db-7d06-4b0c-9046-44647c178ff9_782x634.png 848w, https://substackcdn.com/image/fetch/$s_!KSjx!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F66f621db-7d06-4b0c-9046-44647c178ff9_782x634.png 1272w, https://substackcdn.com/image/fetch/$s_!KSjx!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F66f621db-7d06-4b0c-9046-44647c178ff9_782x634.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>If you&#8217;re worried about generative AI making students lazy, you might be perfectly fine with AI assistance as long as it&#8217;s just ranking results. Let the algorithms find relevant papers, but make students read and synthesise themselves.</p><p>If you&#8217;re worried about environmental impact or IP issues of huge GPT-style LLMs, you might accept encoder embeddings but draw a hard line at any use of GPT-type models.</p><p>If you&#8217;re worried about reproducibility or interpretability&#8212;and regular readers know this is my particular obsession&#8212;you might object to any non-Boolean/lexical methods, and maybe even AI-generated metadata.</p><p>If you&#8217;re worried about accuracy and hallucination, the earlier levels might be fine but synthesis crosses the line. 
Ranking can be imperfect without being catastrophically wrong, but generation creates new opportunities for confident-sounding nonsense.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!F504!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!F504!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 424w, https://substackcdn.com/image/fetch/$s_!F504!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 848w, https://substackcdn.com/image/fetch/$s_!F504!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!F504!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!F504!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg" width="1024" height="541" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/bc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:541,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:138031,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180945021?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!F504!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 424w, https://substackcdn.com/image/fetch/$s_!F504!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 848w, https://substackcdn.com/image/fetch/$s_!F504!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!F504!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc49a343-b062-4e33-9d7d-b229fec9bddb_1024x541.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><h2>Where Do Common Tools Actually Sit?</h2><p>Given this framework, it&#8217;s worth examining where familiar platforms actually fall&#8212;because the answer isn&#8217;t always obvious.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!drir!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6cccdac-ed36-4464-a5d7-19fa21a0b62e_695x712.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!drir!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6cccdac-ed36-4464-a5d7-19fa21a0b62e_695x712.png 424w, 
https://substackcdn.com/image/fetch/$s_!drir!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6cccdac-ed36-4464-a5d7-19fa21a0b62e_695x712.png 848w, https://substackcdn.com/image/fetch/$s_!drir!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6cccdac-ed36-4464-a5d7-19fa21a0b62e_695x712.png 1272w, https://substackcdn.com/image/fetch/$s_!drir!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6cccdac-ed36-4464-a5d7-19fa21a0b62e_695x712.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!drir!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6cccdac-ed36-4464-a5d7-19fa21a0b62e_695x712.png" width="695" height="712" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c6cccdac-ed36-4464-a5d7-19fa21a0b62e_695x712.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:712,&quot;width&quot;:695,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:72588,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180945021?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6cccdac-ed36-4464-a5d7-19fa21a0b62e_695x712.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!drir!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6cccdac-ed36-4464-a5d7-19fa21a0b62e_695x712.png 424w, 
https://substackcdn.com/image/fetch/$s_!drir!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6cccdac-ed36-4464-a5d7-19fa21a0b62e_695x712.png 848w, https://substackcdn.com/image/fetch/$s_!drir!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6cccdac-ed36-4464-a5d7-19fa21a0b62e_695x712.png 1272w, https://substackcdn.com/image/fetch/$s_!drir!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6cccdac-ed36-4464-a5d7-19fa21a0b62e_695x712.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h3>The &#8220;Semantic Scholar&#8221; Confusion</h3><p>Here&#8217;s an irony worth noting: <a href="https://www.semanticscholar.org/me/research">Semantic Scholar</a>&#8212;the platform whose name suggests semantic search&#8212;doesn&#8217;t actually use vector embeddings for its main search retrieval&#8212;at least not for <a href="https://www.semanticscholar.org/me/research">the search on its home page</a> as of April 2025.</p><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!kIb5!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b7043ed-cdc1-4e0a-b634-39e8a6002cc9_1768x383.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!kIb5!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b7043ed-cdc1-4e0a-b634-39e8a6002cc9_1768x383.png 424w, https://substackcdn.com/image/fetch/$s_!kIb5!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b7043ed-cdc1-4e0a-b634-39e8a6002cc9_1768x383.png 848w, https://substackcdn.com/image/fetch/$s_!kIb5!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b7043ed-cdc1-4e0a-b634-39e8a6002cc9_1768x383.png 1272w, https://substackcdn.com/image/fetch/$s_!kIb5!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b7043ed-cdc1-4e0a-b634-39e8a6002cc9_1768x383.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!kIb5!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b7043ed-cdc1-4e0a-b634-39e8a6002cc9_1768x383.png" width="1456" height="315" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/0b7043ed-cdc1-4e0a-b634-39e8a6002cc9_1768x383.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:315,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:66034,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:&quot;&quot;,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180945021?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b7043ed-cdc1-4e0a-b634-39e8a6002cc9_1768x383.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!kIb5!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b7043ed-cdc1-4e0a-b634-39e8a6002cc9_1768x383.png 424w, https://substackcdn.com/image/fetch/$s_!kIb5!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b7043ed-cdc1-4e0a-b634-39e8a6002cc9_1768x383.png 848w, https://substackcdn.com/image/fetch/$s_!kIb5!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b7043ed-cdc1-4e0a-b634-39e8a6002cc9_1768x383.png 1272w, 
https://substackcdn.com/image/fetch/$s_!kIb5!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b7043ed-cdc1-4e0a-b634-39e8a6002cc9_1768x383.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p><a href="https://arxiv.org/abs/2301.10140">According to a preprint updated April 2025</a>, the platform&#8217;s search operates in two stages: first, Elasticsearch retrieves up to 1,000 candidates using keyword matching (probably BM25); then these are reranked using a LightGBM model that emphasises direct title matches and highly-cited recent papers.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Aa6Y!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7332a736-5da2-4d9b-92bf-25abff4b3570_876x377.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Aa6Y!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7332a736-5da2-4d9b-92bf-25abff4b3570_876x377.jpeg 424w, https://substackcdn.com/image/fetch/$s_!Aa6Y!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7332a736-5da2-4d9b-92bf-25abff4b3570_876x377.jpeg 848w, https://substackcdn.com/image/fetch/$s_!Aa6Y!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7332a736-5da2-4d9b-92bf-25abff4b3570_876x377.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!Aa6Y!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7332a736-5da2-4d9b-92bf-25abff4b3570_876x377.jpeg 1456w" 
sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Aa6Y!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7332a736-5da2-4d9b-92bf-25abff4b3570_876x377.jpeg" width="876" height="377" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/7332a736-5da2-4d9b-92bf-25abff4b3570_876x377.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:377,&quot;width&quot;:876,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:&quot;&quot;,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!Aa6Y!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7332a736-5da2-4d9b-92bf-25abff4b3570_876x377.jpeg 424w, https://substackcdn.com/image/fetch/$s_!Aa6Y!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7332a736-5da2-4d9b-92bf-25abff4b3570_876x377.jpeg 848w, https://substackcdn.com/image/fetch/$s_!Aa6Y!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7332a736-5da2-4d9b-92bf-25abff4b3570_876x377.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!Aa6Y!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7332a736-5da2-4d9b-92bf-25abff4b3570_876x377.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" 
type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><blockquote><p>LightGBM is a gradient-boosted decision tree ranker&#8212;machine learning, but not a neural embedding model and not generative. It&#8217;s a feature-driven reranker sitting between BM25-style retrieval and modern transformer-heavy &#8220;AI search.&#8221;</p><p>More specifically, it&#8217;s a supervised or semi-supervised learning model trained on labelled data (e.g., relevance judgments or interaction signals) to learn a scoring function that combines feature-based signals&#8212;query/field match strength, citations, publication year, etc.&#8212;into a final relevance score. 
</p><p>It&#8217;s typically used in a <strong>learning-to-rank&#8211;style</strong> setup (often with ranking objectives like LambdaRank), meaning it learns how to order candidate documents for a query rather than generate text. </p></blockquote><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!30Gn!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff70d29bf-1b34-4343-91d9-2bba5b1a4281_738x496.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!30Gn!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff70d29bf-1b34-4343-91d9-2bba5b1a4281_738x496.png 424w, https://substackcdn.com/image/fetch/$s_!30Gn!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff70d29bf-1b34-4343-91d9-2bba5b1a4281_738x496.png 848w, https://substackcdn.com/image/fetch/$s_!30Gn!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff70d29bf-1b34-4343-91d9-2bba5b1a4281_738x496.png 1272w, https://substackcdn.com/image/fetch/$s_!30Gn!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff70d29bf-1b34-4343-91d9-2bba5b1a4281_738x496.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!30Gn!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff70d29bf-1b34-4343-91d9-2bba5b1a4281_738x496.png" width="738" height="496" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f70d29bf-1b34-4343-91d9-2bba5b1a4281_738x496.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:496,&quot;width&quot;:738,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:415589,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:&quot;&quot;,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180945021?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff70d29bf-1b34-4343-91d9-2bba5b1a4281_738x496.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!30Gn!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff70d29bf-1b34-4343-91d9-2bba5b1a4281_738x496.png 424w, https://substackcdn.com/image/fetch/$s_!30Gn!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff70d29bf-1b34-4343-91d9-2bba5b1a4281_738x496.png 848w, https://substackcdn.com/image/fetch/$s_!30Gn!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff70d29bf-1b34-4343-91d9-2bba5b1a4281_738x496.png 1272w, https://substackcdn.com/image/fetch/$s_!30Gn!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff70d29bf-1b34-4343-91d9-2bba5b1a4281_738x496.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" 
width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>So where do the embeddings come in? Semantic Scholar developed SPECTER and <a href="https://huggingface.co/allenai/specter2">SPECTER2</a>, sophisticated document embedding models trained on citation graphs. But these power auxiliary features: research feed recommendations, author disambiguation, paper clustering, and finding related papers. The embeddings exist; they&#8217;re just not driving the core search experience.  </p><blockquote><p>There is one exception: their newer <strong>&#8220;snippet search&#8221; API endpoint</strong>, designed for retrieving text passages from the S2ORC corpus, does use a genuine hybrid approach. 
Passages are embedded using mxbai-embed-large-v1, and results are retrieved using the union of embedding-based and keyword-based matches, ranked by a weighted sum of embedding similarity and BM25 scores (Kinney et al., 2023). But this is a specialised API for full-text passage retrieval&#8212;not the main search you get from the <a href="https://www.semanticscholar.org/me/research">Semantic Scholar Search bar</a> that most users encounter.</p></blockquote><p>You might be wondering why I am harping on this. After all, Semantic Scholar has many features that are clearly AI-powered, such as &#8220;TLDR&#8221;, &#8220;Ask this paper&#8221;, Citation sentiment (e.g., &#8220;Highly Influential Citations&#8221;), and Research Feeds.</p><p>This matters because if you&#8217;re advising researchers, the name might reasonably lead you to assume you&#8217;re getting embedding-based semantic retrieval. In fact, I have seen quite a few libraries list Semantic Scholar in their LibGuides as &#8220;semantic/neural/vector search&#8221;. </p><p>You&#8217;re not&#8212;at least not in the primary interface. </p><p>This misunderstanding might then lead you to search using natural language rather than keywords, since natural language typically works better in semantic retrieval systems. Unfortunately, this fails here. 
The query:</p><p><code>Is there an open access citation advantage</code></p><p>returns only 13 results (big underestimate), while keyword search even with quotes gets a more reasonable 54.</p><p> </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!-Ot_!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!-Ot_!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 424w, https://substackcdn.com/image/fetch/$s_!-Ot_!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 848w, https://substackcdn.com/image/fetch/$s_!-Ot_!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 1272w, https://substackcdn.com/image/fetch/$s_!-Ot_!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!-Ot_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png" width="1190" height="304" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/cf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:304,&quot;width&quot;:1190,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:24772,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:&quot;&quot;,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180945021?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!-Ot_!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 424w, https://substackcdn.com/image/fetch/$s_!-Ot_!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 848w, https://substackcdn.com/image/fetch/$s_!-Ot_!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 1272w, https://substackcdn.com/image/fetch/$s_!-Ot_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcf7db251-93f9-44ea-b8c2-68ba5021102d_1190x304.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg 
role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p> </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!BxZ3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2a41a4a-163f-4515-9059-ca7f981d4115_1099x290.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!BxZ3!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2a41a4a-163f-4515-9059-ca7f981d4115_1099x290.png 424w, 
https://substackcdn.com/image/fetch/$s_!BxZ3!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2a41a4a-163f-4515-9059-ca7f981d4115_1099x290.png 848w, https://substackcdn.com/image/fetch/$s_!BxZ3!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2a41a4a-163f-4515-9059-ca7f981d4115_1099x290.png 1272w, https://substackcdn.com/image/fetch/$s_!BxZ3!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2a41a4a-163f-4515-9059-ca7f981d4115_1099x290.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!BxZ3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2a41a4a-163f-4515-9059-ca7f981d4115_1099x290.png" width="1099" height="290" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/a2a41a4a-163f-4515-9059-ca7f981d4115_1099x290.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:290,&quot;width&quot;:1099,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!BxZ3!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2a41a4a-163f-4515-9059-ca7f981d4115_1099x290.png 424w, 
https://substackcdn.com/image/fetch/$s_!BxZ3!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2a41a4a-163f-4515-9059-ca7f981d4115_1099x290.png 848w, https://substackcdn.com/image/fetch/$s_!BxZ3!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2a41a4a-163f-4515-9059-ca7f981d4115_1099x290.png 1272w, https://substackcdn.com/image/fetch/$s_!BxZ3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa2a41a4a-163f-4515-9059-ca7f981d4115_1099x290.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2><strong>Are OpenAlex or Lens.org AI-Powered?</strong></h2><p>Listing Semantic Scholar as &#8220;AI powered search&#8221; at least makes some sense because of its many AI features. </p><p>On the other hand, I also notice quite a few LibGuides classify <a href="http://openalex.org">OpenAlex</a> and <a href="http://lens.org">Lens.org</a> as &#8220;AI powered/LLM search&#8221; or, worse, as semantic/neural search. This is a much less defensible move. Both are pure lexical search engines with no LLM used in retrieval or ranking, and no synthesis features.</p><blockquote><p> New! <a href="https://blog.openalex.org/openalex-rewrite-enters-beta-%F0%9F%8E%89/#:~:text=Vector%20search%20endpoint%3A%20find%20relevant%20works%20and%20other%20entities%20based%20on%20semantic%20similarity%20of%20free%2Dform%20text">In the latest Walden update, OpenAlex is planning a Vector search endpoint: find relevant works and other entities based on semantic similarity of free-form text</a>.  <a href="https://blog.openalex.org/openalex-api-new-features-and-usage-based-pricing/">As of 24 Feb 2026, OpenAlex now has semantic search</a>.</p></blockquote><p>This is probably just a misunderstanding by some librarians as they became aware of Lens.org and OpenAlex only recently (<a href="https://about.lens.org/release-5-4-0/">Lens.org actually started going beyond Lens search with Scholarly search in Dec 2017</a>) and mistakenly assumed they were in the same class as newer search tools, but is there a way to argue they are &#8220;AI-powered&#8221; search engines?</p><p>Perhaps you might argue that using AI to extract, cluster, or organise metadata makes a search engine &#8220;AI-powered&#8221;, and that because we know OpenAlex uses machine learning for topic assignment and author disambiguation, it is AI-powered. 
</p><p>But the problem with this is that by this standard, even traditional databases like Scopus would qualify&#8212;they use clustering algorithms for author disambiguation and citation parsing.</p><p>You can try to draw a line to decide which methods are &#8220;AI&#8221; which are not (the same way we can with retrieval algos) and decide you&#8217;re okay with good old-fashioned machine learning or even embeddings if they are used to extract or clean up metadata but are not okay if LLMs are used.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!DvxY!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc1e9bce-879d-4970-b03b-cc58ac9298d5_916x435.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!DvxY!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc1e9bce-879d-4970-b03b-cc58ac9298d5_916x435.png 424w, https://substackcdn.com/image/fetch/$s_!DvxY!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc1e9bce-879d-4970-b03b-cc58ac9298d5_916x435.png 848w, https://substackcdn.com/image/fetch/$s_!DvxY!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc1e9bce-879d-4970-b03b-cc58ac9298d5_916x435.png 1272w, https://substackcdn.com/image/fetch/$s_!DvxY!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc1e9bce-879d-4970-b03b-cc58ac9298d5_916x435.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!DvxY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc1e9bce-879d-4970-b03b-cc58ac9298d5_916x435.png" width="916" height="435" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/bc1e9bce-879d-4970-b03b-cc58ac9298d5_916x435.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:435,&quot;width&quot;:916,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:42645,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180945021?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc1e9bce-879d-4970-b03b-cc58ac9298d5_916x435.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!DvxY!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc1e9bce-879d-4970-b03b-cc58ac9298d5_916x435.png 424w, https://substackcdn.com/image/fetch/$s_!DvxY!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc1e9bce-879d-4970-b03b-cc58ac9298d5_916x435.png 848w, https://substackcdn.com/image/fetch/$s_!DvxY!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc1e9bce-879d-4970-b03b-cc58ac9298d5_916x435.png 1272w, https://substackcdn.com/image/fetch/$s_!DvxY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc1e9bce-879d-4970-b03b-cc58ac9298d5_916x435.png 1456w" sizes="100vw" 
loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><a href="https://substack.com/@researchmusings/p-179126788">Dimensions has an interesting post on the different types of &#8220;AI&#8221; (Symbolic AI, Discriminative AI, embeddings, knowledge graphs and even generative AI) employed under the hood for metadata</a>.  </p><blockquote><p>When you browse Dimensions to identify research funded by NIH, when publications from an author who moved affiliation are under the same profile, when a cluster gets labeled with a coherent name, this is Artificial Intelligence at work, although not all is Generative AI. 
So, what are the different flavours of AI and what do they do?</p></blockquote><p>But this whole thing sounds very contrived, and I think most would agree that the use of &#8220;AI&#8221; for metadata handling should not, by itself, qualify something as an AI-powered search engine.  </p><h2>What I&#8217;m Getting At</h2><p>I&#8217;m not trying to tell you where to draw your line. What I am saying is: watch out for knee-jerk reactions (my own included!) that treat &#8220;AI&#8221; as a monolithic thing we either accept or reject wholesale.</p><p>The field is rapidly developing systems that incorporate different types of AI at different layers, in different ways, for different purposes. Some of those uses might align with your values and needs. Others might not. But you can&#8217;t make that determination until you actually understand what&#8217;s under the hood.</p><p>And unfortunately, that&#8217;s often the hardest part&#8212;because many of these systems are black boxes that don&#8217;t clearly explain which AI techniques they&#8217;re using, where, or why. 
Which brings me back to my recurring theme: methodological transparency matters.</p><p>We can&#8217;t make informed decisions about what AI search tools to use (or refuse to use) if we don&#8217;t actually know what they&#8217;re doing.</p><p>So the next time you see an &#8220;AI-powered search engine,&#8221; maybe the first question shouldn&#8217;t be &#8220;Is this AI?&#8221; but rather &#8220;What kind of AI, and where and how is it used in the pipeline?&#8221;</p><h2>Appendix </h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!JR0k!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa84dcdfd-c531-48dc-a778-ee3a6775254a_1024x565.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!JR0k!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa84dcdfd-c531-48dc-a778-ee3a6775254a_1024x565.jpeg 424w, https://substackcdn.com/image/fetch/$s_!JR0k!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa84dcdfd-c531-48dc-a778-ee3a6775254a_1024x565.jpeg 848w, https://substackcdn.com/image/fetch/$s_!JR0k!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa84dcdfd-c531-48dc-a778-ee3a6775254a_1024x565.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!JR0k!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa84dcdfd-c531-48dc-a778-ee3a6775254a_1024x565.jpeg 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!JR0k!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa84dcdfd-c531-48dc-a778-ee3a6775254a_1024x565.jpeg" width="1024" height="565" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/a84dcdfd-c531-48dc-a778-ee3a6775254a_1024x565.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:565,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:133501,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180945021?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa84dcdfd-c531-48dc-a778-ee3a6775254a_1024x565.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!JR0k!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa84dcdfd-c531-48dc-a778-ee3a6775254a_1024x565.jpeg 424w, https://substackcdn.com/image/fetch/$s_!JR0k!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa84dcdfd-c531-48dc-a778-ee3a6775254a_1024x565.jpeg 848w, https://substackcdn.com/image/fetch/$s_!JR0k!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa84dcdfd-c531-48dc-a778-ee3a6775254a_1024x565.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!JR0k!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa84dcdfd-c531-48dc-a778-ee3a6775254a_1024x565.jpeg 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Questions to ask or think about for an AI-powered search</p><p><strong>A) Where is AI used in the pipeline?</strong></p><ol><li><p>Query formulation (query rewriting, Boolean drafting)</p></li><li><p>Retrieval (candidate generation)</p></li><li><p>Ranking (reranking / learning-to-rank / LLM judging)</p></li><li><p>Result enrichment (snippets, TLDRs, explanations)</p></li><li><p>Synthesis (multi-document answer)</p></li></ol><p><strong>B) What kind of AI model is used there?</strong></p><ul><li><p>classic IR (Boolean/BM25)</p></li><li><p>&#8220;traditional&#8221; ML (e.g., boosted trees 
/ LTR -Learning to Rank)</p></li><li><p>embeddings (encoder models; dense/sparse)</p></li><li><p>generative LLMs (decoder; possibly multimodal)</p></li></ul><p><em>Images generated with help of Gemini 3 Pro</em></p>]]></content:encoded></item><item><title><![CDATA[Why Ghost References Still Haunt Us in 2025—And Why It's Not Just About LLMs]]></title><description><![CDATA[Ghost references existed long before LLMs. This post examines how Google Scholar's [CITATION] mechanism and web pollution may undermine RAG verification.]]></description><link>https://aarontay.substack.com/p/why-ghost-references-still-haunt</link><guid isPermaLink="false">https://aarontay.substack.com/p/why-ghost-references-still-haunt</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Mon, 22 Dec 2025 19:23:37 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!mrx3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!mwHv!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed218ee3-83d6-4769-b3fe-cda2df671af0_800x800.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!mwHv!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed218ee3-83d6-4769-b3fe-cda2df671af0_800x800.jpeg 424w, https://substackcdn.com/image/fetch/$s_!mwHv!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed218ee3-83d6-4769-b3fe-cda2df671af0_800x800.jpeg 848w, 
https://substackcdn.com/image/fetch/$s_!mwHv!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed218ee3-83d6-4769-b3fe-cda2df671af0_800x800.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!mwHv!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed218ee3-83d6-4769-b3fe-cda2df671af0_800x800.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!mwHv!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed218ee3-83d6-4769-b3fe-cda2df671af0_800x800.jpeg" width="800" height="800" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ed218ee3-83d6-4769-b3fe-cda2df671af0_800x800.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:800,&quot;width&quot;:800,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!mwHv!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed218ee3-83d6-4769-b3fe-cda2df671af0_800x800.jpeg 424w, https://substackcdn.com/image/fetch/$s_!mwHv!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed218ee3-83d6-4769-b3fe-cda2df671af0_800x800.jpeg 848w, 
https://substackcdn.com/image/fetch/$s_!mwHv!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed218ee3-83d6-4769-b3fe-cda2df671af0_800x800.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!mwHv!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fed218ee3-83d6-4769-b3fe-cda2df671af0_800x800.jpeg 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me Coffee! 
(via ko-fi)&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me Coffee! (via ko-fi)</span></a></p><p>As early as late 2022, I understood that Retrieval Augmented Generation (RAG) would be the future. By grounding LLM responses in retrieved content, RAG should reduce or even eliminate certain types of hallucinations&#8212;including the dreaded ghost reference: a citation to a paper that simply does not exist.</p><p>To be clear about terms:</p><ul><li><p><strong>Ghost reference:</strong> a citation to a work that <em>does not exist</em>.</p></li><li><p><strong>Citation unfaithfulness:</strong> a citation to a <em>real</em> work that doesn&#8217;t actually support the claim being made.</p></li><li><p><strong>&#8220;Existing&#8221; or &#8220;real&#8221; reference: </strong>A work you can point to, access, or verify exists. Quality is not guaranteed&#8212;such a work might be a legitimate but retracted paper (a &#8220;<a href="https://www.science.org/content/article/zombie-papers-wont-die-retracted-papers-notorious-fraudster-still-cited-years-later">zombie citation</a>&#8221;) or a product of paper mills, which these days often but not always means a fully AI-generated paper. Nevertheless, it still counts as &#8220;existing&#8221; in this context. An &#8220;existing&#8221; paper or reference might itself cite ghost references.</p></li></ul><p>In the early days of ChatGPT (GPT-3.5 era), ghost references were common because these tools (or at least the free versions) didn&#8217;t perform web searches to ground their outputs&#8212;which was akin to asking a human to cite papers without searching to confirm whether they &#8220;remembered&#8221; the reference correctly. But that&#8217;s no longer true for most modern systems, which search the web and perform Retrieval Augmented Generation (see the image below, generated by NanoBanana Pro). 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!mrx3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!mrx3!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 424w, https://substackcdn.com/image/fetch/$s_!mrx3!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 848w, https://substackcdn.com/image/fetch/$s_!mrx3!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!mrx3!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!mrx3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg" width="1024" height="565" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:565,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:96460,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/182180407?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!mrx3!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 424w, https://substackcdn.com/image/fetch/$s_!mrx3!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 848w, https://substackcdn.com/image/fetch/$s_!mrx3!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!mrx3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F84b6be18-92f6-44ff-9bdf-9148d4c9edb7_1024x565.jpeg 1456w" sizes="100vw"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>While this problem of ghost references no longer seems to be a serious issue at my institution, a quick scan of librarian blogs and social media <a href="https://www.rollingstone.com/culture/culture-features/ai-chatbot-journal-research-fake-citations-1235485484/">suggests this problem is still a huge issue</a>. Why is this?</p><p>I think the answer is more uncomfortable than &#8220;LLMs hallucinate.&#8221; </p><p>The answer lies in a troubling interaction between two vulnerabilities. </p><p>The first is architectural: Google Scholar creates [CITATION] records for references it cannot match to actual documents. These stubs&#8212;inferred from bibliographies rather than verified sources&#8212;allow fabricated references to accumulate citations and apparent legitimacy from humans and possibly LLMs alike. 
</p><p>The second is that RAG systems using general web search can be fooled by this and similar pollution. When an LLM searches the web to verify a citation, it may find pages that themselves cite the ghost reference, concluding the paper must be real.</p><p>In short, ghost references are not primarily an LLM/GenAI phenomenon. They have always existed, propagated by entirely human mechanisms&#8212;typos, careless copying, citing without reading. What LLM/GenAI has done is accelerate and amplify a pre-existing structural vulnerability in scholarly communication infrastructure. The web is already contaminated; RAG with web search inherits that contamination.</p><p> </p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><h2>How Academic RAG Actually Prevents Ghost References</h2><p>I noticed early on that academic RAG and Deep Research tools largely solved the ghost reference problem. 
<a href="https://www.researchgate.net/publication/383988574_Correctness_and_Quality_of_References_generated_by_AI-based_Research_Assistant_Tools_The_Case_of_Scopus_AI_Elicit_SciSpace_and_Scite_in_the_Field_of_Business_Administration">A 2023 thesis demonstrated that even basic early academic RAG systems like Scopus AI, Elicit, and SciSpace do not fabricate references</a>. </p><p>Minor citation errors still occur, but these typically originate from upstream metadata issues&#8212;think of how Google Scholar sometimes displays incorrect publication years due to merging preprints with the version of record.</p><h3>Going deeper into how RAG generates citations</h3><p>LLMs do not naturally cite the text chunks they retrieve, and even when instructed to do so, how do you guard against cases where they don&#8217;t follow instructions? However, there are architectural approaches that can virtually guarantee zero fabricated citations. Here is one such method (see image below, generated by Nano Banana Pro): </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!eVya!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad20bdd0-4363-4861-ba07-475d337747d1_1193x661.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!eVya!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad20bdd0-4363-4861-ba07-475d337747d1_1193x661.png 424w, https://substackcdn.com/image/fetch/$s_!eVya!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad20bdd0-4363-4861-ba07-475d337747d1_1193x661.png 848w, 
https://substackcdn.com/image/fetch/$s_!eVya!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad20bdd0-4363-4861-ba07-475d337747d1_1193x661.png 1272w, https://substackcdn.com/image/fetch/$s_!eVya!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad20bdd0-4363-4861-ba07-475d337747d1_1193x661.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!eVya!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad20bdd0-4363-4861-ba07-475d337747d1_1193x661.png" width="1193" height="661" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ad20bdd0-4363-4861-ba07-475d337747d1_1193x661.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:661,&quot;width&quot;:1193,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1094774,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/182180407?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad20bdd0-4363-4861-ba07-475d337747d1_1193x661.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!eVya!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad20bdd0-4363-4861-ba07-475d337747d1_1193x661.png 424w, 
https://substackcdn.com/image/fetch/$s_!eVya!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad20bdd0-4363-4861-ba07-475d337747d1_1193x661.png 848w, https://substackcdn.com/image/fetch/$s_!eVya!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad20bdd0-4363-4861-ba07-475d337747d1_1193x661.png 1272w, https://substackcdn.com/image/fetch/$s_!eVya!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fad20bdd0-4363-4861-ba07-475d337747d1_1193x661.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><strong>Step 1: Unique ID Assignment.</strong> The database assigns a unique identifier to each document chunk. When chunks are retrieved in response to a query, they carry these identifiers along with their text.</p><p>For example, given the query </p><p><code>&#8220;Which library is the oldest public branch library in Singapore?&#8221;</code></p><p>the retrieval step might return:</p><ul><li><p><code>&lt;text chunk 1&gt; [UniqueID-XYAD]</code></p></li><li><p><code>&lt;text chunk 2&gt; [UniqueID-QASD]</code></p></li><li><p><code>First public branch library in Singapore was in Queenstown [UniqueID-XXXX]</code></p></li></ul><p><strong>Step 2: ID-Only Citation Generation. </strong>The LLM is prompted and fine-tuned to generate text with only the unique ID&#8212;not the full citation. For instance, it might produce the following:</p><p><code>Singapore&#8217;s oldest public branch library is in Queenstown [UniqueID-XXXX].</code></p><p><strong>Step 3: Post-Hoc Verification. </strong>A non-LLM method (typically a Python script) verifies that each generated unique ID matches a retrieved document and exists in the database. This catches any hallucinated identifiers.</p><p><strong>Step 4: Programmatic Citation Replacement.</strong> Finally, a deterministic process (such as regular expressions in a Python script) replaces each unique ID with the full, verified citation or metadata. We do not trust the LLM to generate complete citations because it might hallucinate details.</p><p>This architecture virtually eliminates ghost references, as the LLM never gets a chance to invent citation metadata. That said, it cannot prevent unfaithful statements&#8212;claims that misrepresent what the cited work actually says. Various methods exist to detect unfaithful claims (e.g., <a href="https://arxiv.org/pdf/2408.12398">entailment-based verification</a>), but none are foolproof. 
</p><p>Critically, this approach works because academic RAG systems perform retrieval over a <em>known, curated, and bounded</em> corpus. General-purpose LLMs searching the open web cannot easily adopt this strategy&#8212;and therein lies part of the problem.  </p><h2>Ghost References Have Always Existed before the use of LLMs  </h2><p>Someone shared with me the following Bluesky post.</p><div class="bluesky-wrap outer" style="height: auto; display: flex; margin-bottom: 24px;" data-attrs="{&quot;postId&quot;:&quot;3mae7iq3ccc2n&quot;,&quot;authorDid&quot;:&quot;did:plc:rl2szulxujlgdcmx4avx7jyn&quot;,&quot;authorName&quot;:&quot;Ben Williamson&quot;,&quot;authorHandle&quot;:&quot;benpatrickwill.bsky.social&quot;,&quot;authorAvatarUrl&quot;:&quot;https://cdn.bsky.app/img/avatar/plain/did:plc:rl2szulxujlgdcmx4avx7jyn/bafkreidfafo4bhtukpq3w25eluxnkln7im4recvjkenvwjafje4rlaec5m@jpeg&quot;,&quot;text&quot;:&quot;And so checked out Google Scholar. Now on my profile it doesn't appear, but somwhow on Nelli's it does and ... and ... omg, IT'S BEEN CITED 42 TIMES almost exlusively in papers about AI in education from this year alone... 
scholar.google.com.vn/citations?vi...&quot;,&quot;createdAt&quot;:&quot;2025-12-19T17:25:33.173Z&quot;,&quot;uri&quot;:&quot;at://did:plc:rl2szulxujlgdcmx4avx7jyn/app.bsky.feed.post/3mae7iq3ccc2n&quot;,&quot;imageUrls&quot;:[]}" data-component-name="BlueskyCreateBlueskyEmbed"><iframe id="bluesky-3mae7iq3ccc2n" data-bluesky-id="6067351007543675" src="https://embed.bsky.app/embed/did:plc:rl2szulxujlgdcmx4avx7jyn/app.bsky.feed.post/3mae7iq3ccc2n?id=6067351007543675" width="100%" style="display: block; flex-grow: 1;" frameborder="0" scrolling="no"></iframe></div><p>This <a href="https://bsky.app/profile/benpatrickwill.bsky.social/post/3mae76wc7ts2n">Bluesky post</a> <a href="https://scholar.google.com/scholar?cluster=1795648861839846375&amp;hl=en&amp;inst=14102473421921925766&amp;oi=scholarr">highlighted a ghost reference that had accumulated 43 citations in Google Scholar</a>. The &#8220;paper&#8221; appeared as a [CITATION] entry&#8212;a type of Google Scholar record we&#8217;ll examine in detail shortly. </p><p>While works on roughly the same topic by the purported authors exist (for instance, <a href="https://www.tandfonline.com/doi/full/10.1080/17439884.2018.1556215">Williamson &amp; Piattoeva published on related topics in 2019</a> and in a <a href="https://www.taylorfrancis.com/chapters/edit/10.4324/9780429341359-7/objectivity-standardization-data-scientific-education-policy-technology-governance-ben-williamson-nelli-piattoeva">2020 book chapter</a>), this specific reference does not correspond to any real publication.  
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!8Q6K!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F174cd047-7897-497e-af41-2a3d8e185a7a_914x270.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!8Q6K!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F174cd047-7897-497e-af41-2a3d8e185a7a_914x270.png 424w, https://substackcdn.com/image/fetch/$s_!8Q6K!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F174cd047-7897-497e-af41-2a3d8e185a7a_914x270.png 848w, https://substackcdn.com/image/fetch/$s_!8Q6K!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F174cd047-7897-497e-af41-2a3d8e185a7a_914x270.png 1272w, https://substackcdn.com/image/fetch/$s_!8Q6K!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F174cd047-7897-497e-af41-2a3d8e185a7a_914x270.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!8Q6K!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F174cd047-7897-497e-af41-2a3d8e185a7a_914x270.png" width="914" height="270" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/174cd047-7897-497e-af41-2a3d8e185a7a_914x270.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:270,&quot;width&quot;:914,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:25033,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/182180407?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F174cd047-7897-497e-af41-2a3d8e185a7a_914x270.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!8Q6K!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F174cd047-7897-497e-af41-2a3d8e185a7a_914x270.png 424w, https://substackcdn.com/image/fetch/$s_!8Q6K!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F174cd047-7897-497e-af41-2a3d8e185a7a_914x270.png 848w, https://substackcdn.com/image/fetch/$s_!8Q6K!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F174cd047-7897-497e-af41-2a3d8e185a7a_914x270.png 1272w, https://substackcdn.com/image/fetch/$s_!8Q6K!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F174cd047-7897-497e-af41-2a3d8e185a7a_914x270.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>I suspect most people initially assumed this was an LLM-hallucinated reference that had propagated through the system. But my response hinted that this might not necessarily be the case. </p><p>Regardless of the initial source of the error, the Google Scholar practice of generating [CITATION] records is quite dangerous; as we shall see, this practice can &#8220;pollute&#8221; the web.</p><p>Examining the citing articles revealed something important: citations to this ghost reference came from papers <em>supposedly published in 2019 and 2021!</em></p><p>This was years before ChatGPT&#8217;s widespread adoption in late 2022, and while GPT-2 (2019) and GPT-3 (2020) existed, they were unlikely to be the cause of a 2019 or even 2021 citing paper.</p><p>This complicates the easy narrative that GenAI created the ghost reference problem. 
These early citations were likely produced by humans through entirely traditional mechanisms:</p><ul><li><p>Typographical errors that propagated</p></li><li><p>Careless copying of reference lists without verification</p></li><li><p>Conflating two similar papers into one that doesn&#8217;t exist</p></li><li><p>Simply misremembering a paper</p></li></ul><p>That said, one can easily see the offending citing papers are from very poor-quality sources, so we can&#8217;t even be sure if the publication dates are correct! </p><p>Still, I wouldn&#8217;t be surprised if at least some of them are really just errors from humans. </p><p>This shouldn&#8217;t surprise us. The empirical literature on citation practices has long documented these patterns. <a href="https://arxiv.org/abs/cond-mat/0212043">Simkin and Roychowdhury&#8217;s influential studies estimated that only about 20% of citers actually read the original papers they cite</a>&#8212;the rest probably copy references from other papers&#8217; bibliographies (Simkin &amp; Roychowdhury, 2003). 
Related are studies of academic urban legends - where claims like <a href="https://harzing.com/publications/white-papers/myth-busted-most-academic-research-does-get-cited">&#8220;most papers are not cited&#8221; are asserted by misrepresenting papers</a> - and all of this was done pre-GPT!</p><p>On the particular topic under discussion, it seems <a href="https://www.sciencedirect.com/science/article/pii/S0740624X17300473?via%3Dihub">we also have evidence that ghost references are common (pre-GPT)</a>.</p><p>But as you will see later, more recent ghost references might be LLM/GenAI related.</p><h2>Why &#8220;RAG + web search&#8221; doesn&#8217;t reliably prevent ghost references</h2><p>When I asked <a href="https://chatgpt.com/share/69466f82-2f48-800a-a37d-053cd0608cf7">the free version of ChatGPT (currently GPT-5.2 Instant) to locate the ghost reference</a> from the Bluesky post, it <a href="https://www.scirp.org/reference/referencespapers?referenceid=4104419&amp;utm_source=chatgpt.com">confidently claimed the paper existed and pointed to what appeared to be a source</a>. That source? 
A webpage from another journal that itself had cited the ghost reference.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!lKNI!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F858f29d9-28ff-4473-874f-91a44f344d6b_1220x600.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!lKNI!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F858f29d9-28ff-4473-874f-91a44f344d6b_1220x600.png 424w, https://substackcdn.com/image/fetch/$s_!lKNI!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F858f29d9-28ff-4473-874f-91a44f344d6b_1220x600.png 848w, https://substackcdn.com/image/fetch/$s_!lKNI!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F858f29d9-28ff-4473-874f-91a44f344d6b_1220x600.png 1272w, https://substackcdn.com/image/fetch/$s_!lKNI!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F858f29d9-28ff-4473-874f-91a44f344d6b_1220x600.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!lKNI!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F858f29d9-28ff-4473-874f-91a44f344d6b_1220x600.png" width="1220" height="600" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/858f29d9-28ff-4473-874f-91a44f344d6b_1220x600.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:600,&quot;width&quot;:1220,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!lKNI!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F858f29d9-28ff-4473-874f-91a44f344d6b_1220x600.png 424w, https://substackcdn.com/image/fetch/$s_!lKNI!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F858f29d9-28ff-4473-874f-91a44f344d6b_1220x600.png 848w, https://substackcdn.com/image/fetch/$s_!lKNI!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F858f29d9-28ff-4473-874f-91a44f344d6b_1220x600.png 1272w, https://substackcdn.com/image/fetch/$s_!lKNI!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F858f29d9-28ff-4473-874f-91a44f344d6b_1220x600.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This is perhaps part of the reason why GPT still generates ghost references even with web search.</p><p>To be fair, the paid version of <a href="https://chatgpt.com/share/69467081-c9c4-800a-aeca-81c3dd9c2199">ChatGPT (GPT-5.2 with thinking) occasionally identified the paper as fake by locating the original Bluesky post from the authors</a>. But results were inconsistent&#8212;different prompts yielded different conclusions. </p><blockquote><p>It is unclear to me whether LLMs could be taught to verify papers the way we librarians and researchers do (imagine connecting to MCP sources like Crossref or PubMed) and to say things like &#8220;this reference looks fishy, as the DOI doesn&#8217;t match&#8221; or &#8220;there seems to be no trace of a journal article (beyond its appearance in reference lists) that should be easy to find.&#8221; </p></blockquote><p>The broader lesson: LLMs with general web search can fail to reliably verify references because the web itself contains fake citations. </p><p>This creates a feedback loop. 
A ghost reference (either human or LLM generated) gets cited by a real paper. That paper appears online. An LLM finds the citation and concludes the reference must be real. The ghost becomes increasingly entrenched.</p><p>This is the <a href="https://xkcd.com/978">&#8220;citogenesis&#8221; phenomenon famously illustrated by XKCD</a>.  </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Nwjl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ff90156-3d6c-4279-9a28-00e38e5ccedf_538x614.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Nwjl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ff90156-3d6c-4279-9a28-00e38e5ccedf_538x614.png 424w, https://substackcdn.com/image/fetch/$s_!Nwjl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ff90156-3d6c-4279-9a28-00e38e5ccedf_538x614.png 848w, https://substackcdn.com/image/fetch/$s_!Nwjl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ff90156-3d6c-4279-9a28-00e38e5ccedf_538x614.png 1272w, https://substackcdn.com/image/fetch/$s_!Nwjl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ff90156-3d6c-4279-9a28-00e38e5ccedf_538x614.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Nwjl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ff90156-3d6c-4279-9a28-00e38e5ccedf_538x614.png" width="538" height="614" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/5ff90156-3d6c-4279-9a28-00e38e5ccedf_538x614.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:614,&quot;width&quot;:538,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Citogenesis&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Citogenesis" title="Citogenesis" srcset="https://substackcdn.com/image/fetch/$s_!Nwjl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ff90156-3d6c-4279-9a28-00e38e5ccedf_538x614.png 424w, https://substackcdn.com/image/fetch/$s_!Nwjl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ff90156-3d6c-4279-9a28-00e38e5ccedf_538x614.png 848w, https://substackcdn.com/image/fetch/$s_!Nwjl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ff90156-3d6c-4279-9a28-00e38e5ccedf_538x614.png 1272w, https://substackcdn.com/image/fetch/$s_!Nwjl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ff90156-3d6c-4279-9a28-00e38e5ccedf_538x614.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This occurs when Wikipedia errors propagate into published sources and back again. Reference list errors in influential papers get copied by subsequent authors who don&#8217;t verify their sources. A typo becomes a &#8220;paper&#8221; that dozens of researchers claim to have read.</p><p>Similarly, once a ghost reference appears (human or LLM generated), this citogenesis process can be accelerated by both LLMs and careless humans.</p><p><em>The scary bit is this: even if LLMs from here on out do not hallucinate ghost references &#8220;on their own&#8221; and always take backing from web sources, they may still find existing ghost references and maybe cite them! </em></p><p>What&#8217;s changed is not the existence of ghost references but their potential scale and discoverability. GenAI can produce more content, faster, with confident-sounding citations. 
And when verification is attempted using LLMs with web search, those tools can be fooled by the pre-existing pollution that humans created over decades.</p><p>I want to be careful here: we don&#8217;t yet have good empirical data on how much GenAI has increased the rate of ghost reference creation. This is an important research question. What we can say is that the architectural conditions exist for acceleration, even if quantifying the actual increase remains difficult.</p><h2>Why Google Scholar practice of creating [citation] records is dangerous in this day and age</h2><p>To understand the structural vulnerability at play, we need to examine how citation indexes are constructed.  I always recommend librarians and researchers to understand how citation indexes are created because it explains a lot of issues with citation counts.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!BJEl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef319864-6acc-4de3-8798-06ffe9c34f4d_1175x615.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!BJEl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef319864-6acc-4de3-8798-06ffe9c34f4d_1175x615.png 424w, https://substackcdn.com/image/fetch/$s_!BJEl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef319864-6acc-4de3-8798-06ffe9c34f4d_1175x615.png 848w, https://substackcdn.com/image/fetch/$s_!BJEl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef319864-6acc-4de3-8798-06ffe9c34f4d_1175x615.png 1272w, 
https://substackcdn.com/image/fetch/$s_!BJEl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef319864-6acc-4de3-8798-06ffe9c34f4d_1175x615.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!BJEl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef319864-6acc-4de3-8798-06ffe9c34f4d_1175x615.png" width="1175" height="615" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ef319864-6acc-4de3-8798-06ffe9c34f4d_1175x615.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:615,&quot;width&quot;:1175,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:920556,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/182180407?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef319864-6acc-4de3-8798-06ffe9c34f4d_1175x615.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!BJEl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef319864-6acc-4de3-8798-06ffe9c34f4d_1175x615.png 424w, https://substackcdn.com/image/fetch/$s_!BJEl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef319864-6acc-4de3-8798-06ffe9c34f4d_1175x615.png 848w, 
https://substackcdn.com/image/fetch/$s_!BJEl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef319864-6acc-4de3-8798-06ffe9c34f4d_1175x615.png 1272w, https://substackcdn.com/image/fetch/$s_!BJEl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fef319864-6acc-4de3-8798-06ffe9c34f4d_1175x615.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Citation indexes follow a four-step pipeline:</p><p><strong>1. Collect. </strong>Citation indexes covers a defined set of works. 
Even Google Scholar, as broad as it is, focuses on &#8220;scholarly work.&#8221; So step one is to gather a defined set of works&#8212;specific journals, conference proceedings, book chapters, etc. Most well-known citation indexes focus on journal articles and, to a lesser extent, conference proceedings, book chapters, and occasionally preprints (for broader, more open ones).</p><p><strong>2. Extract.</strong> The system analyzes each collected work to identify its bibliography, pulling out reference strings in indexed works, e.g.:</p><p><code>Small, H. (1973). Co-citation in the scientific literature: A new measure of the relationship between two documents. Journal of the American Society for Information Science, 24(4), 265&#8211;269. https://doi.org/10.1002/asi.4630240406 </code> </p><p><strong>3. Match. </strong>This is the most technically complex step. The system attempts to link extracted references to works already in its database. This is not straightforward. Cited references exhibit enormous variation. Some common issues:</p><ul><li><p>Author name variants (initials, transliterations, name changes)</p></li><li><p>Journal title abbreviations (inconsistent or non-standard)</p></li><li><p>Typographical errors in the original references</p></li><li><p>Incomplete citations</p></li></ul><p>Matching algorithms must balance precision and recall&#8212;too strict and you create false negatives (cited works lose citations); too loose and you create false positives (incorrect links).</p><p><strong>4. Total. </strong>The system aggregates links to quantify influence, producing the citation counts researchers use to gauge impact.</p><p>In short, citation indexes transform static reference lists into dynamic, countable links, converting individual documents into a networked web of scholarship.</p><p>Step 3&#8212;matching&#8212;is the least understood yet most critical part of this process. 
What happens when an extracted reference cannot be matched to any existing work in the database?</p><h2>The Google Scholar [Citation] Vulnerability</h2><p>When an indexed work contains reference strings that don&#8217;t match anything in your index, one option is to do nothing.</p><p>But Google Scholar&#8217;s answer to unmatched references is instead to create<em> [Citation] records</em>&#8212;entries that appear when GS detects a reference in an indexed paper&#8217;s bibliography but cannot locate the actual source document.</p><p>These are essentially citation stubs: metadata records inferred from parsed reference lists rather than from direct indexing of primary documents. </p><p>Key characteristics include:</p><ul><li><p>The title appears with a &#8220;[CITATION]&#8221; prefix and typically isn&#8217;t hyperlinked to full text.</p></li><li><p>Metadata is often incomplete or inaccurate (missing authors, incorrect dates, truncated titles) because it&#8217;s reconstructed from how other papers cited the work.</p></li><li><p>They lack abstracts since Google Scholar never accessed the original document.</p></li><li><p>They still accumulate citation counts&#8212;which is actually their primary function.</p></li></ul><p>This mechanism serves legitimate purposes. An unmatched reference might represent a real work that simply isn&#8217;t indexed by Google Scholar: perhaps a print-only source, a work behind paywalls GS cannot penetrate, or simply a typo that prevented matching. For instance, referencing &#8220;Tay, C.H. (2020)&#8221; when the actual author is &#8220;Tay, C.L. (2020)&#8221; would cause matching to fail. 
</p><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!aukl!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c549f27-cfea-4cb7-80f6-bf2892c3a141_1281x313.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!aukl!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c549f27-cfea-4cb7-80f6-bf2892c3a141_1281x313.png 424w, https://substackcdn.com/image/fetch/$s_!aukl!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c549f27-cfea-4cb7-80f6-bf2892c3a141_1281x313.png 848w, https://substackcdn.com/image/fetch/$s_!aukl!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c549f27-cfea-4cb7-80f6-bf2892c3a141_1281x313.png 1272w, https://substackcdn.com/image/fetch/$s_!aukl!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c549f27-cfea-4cb7-80f6-bf2892c3a141_1281x313.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!aukl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c549f27-cfea-4cb7-80f6-bf2892c3a141_1281x313.png" width="1281" height="313" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/8c549f27-cfea-4cb7-80f6-bf2892c3a141_1281x313.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:313,&quot;width&quot;:1281,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:30332,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/182180407?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c549f27-cfea-4cb7-80f6-bf2892c3a141_1281x313.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!aukl!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c549f27-cfea-4cb7-80f6-bf2892c3a141_1281x313.png 424w, https://substackcdn.com/image/fetch/$s_!aukl!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c549f27-cfea-4cb7-80f6-bf2892c3a141_1281x313.png 848w, https://substackcdn.com/image/fetch/$s_!aukl!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c549f27-cfea-4cb7-80f6-bf2892c3a141_1281x313.png 1272w, https://substackcdn.com/image/fetch/$s_!aukl!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c549f27-cfea-4cb7-80f6-bf2892c3a141_1281x313.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p>My own Medium posts have legitimate [CITATION] entries because they&#8217;ve been cited by indexed scholarly works despite not being &#8220;scholarly&#8221; content that GS would 
directly index.</p><p>But the [CITATION] mechanism has always been a structural vulnerability. It allows fabricated references&#8212;whether created by human error or GenAI hallucination&#8212;to enter the scholarly communication system with an appearance of legitimacy. <em>Once a [CITATION] record exists and accumulates citations, it becomes increasingly difficult to distinguish from a real paper that simply isn&#8217;t available online.</em></p><p>I don&#8217;t believe Google Scholar creates a [CITATION] record for every unmatched reference&#8212;there&#8217;s likely some threshold, such as multiple indexed works citing the same reference.</p><p><em>But once a ghost reference clears that threshold and a Google Scholar [citation] record is created, the citogenesis cycle accelerates. Careless researchers (and LLMs with web search) see the [CITATION] record, assume the paper exists, and cite it themselves.</em></p><blockquote><p>Google Scholar has extremely tight anti-bot features, so LLMs usually cannot search and &#8220;see&#8221; the [CITATION] record directly. But once that record exists on the web, there are numerous ways for it to &#8220;leak out&#8221;&#8212;through library discovery systems, reference management tools, and academic social networks that surface Google Scholar metadata. </p><p>A good example is a journal or ebook with ghost references on a platform that offers link resolver links. 
The system will create a library link resolver link that when clicked brings the user to a library catalog record that looks like a real record you can ask for ILL or Document Delivery!</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!3N2q!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F19296dfb-7802-4278-88d3-8684647d3121_1152x599.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!3N2q!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F19296dfb-7802-4278-88d3-8684647d3121_1152x599.png 424w, https://substackcdn.com/image/fetch/$s_!3N2q!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F19296dfb-7802-4278-88d3-8684647d3121_1152x599.png 848w, https://substackcdn.com/image/fetch/$s_!3N2q!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F19296dfb-7802-4278-88d3-8684647d3121_1152x599.png 1272w, https://substackcdn.com/image/fetch/$s_!3N2q!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F19296dfb-7802-4278-88d3-8684647d3121_1152x599.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!3N2q!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F19296dfb-7802-4278-88d3-8684647d3121_1152x599.png" width="1152" height="599" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/19296dfb-7802-4278-88d3-8684647d3121_1152x599.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:599,&quot;width&quot;:1152,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:33068,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/182180407?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F19296dfb-7802-4278-88d3-8684647d3121_1152x599.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!3N2q!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F19296dfb-7802-4278-88d3-8684647d3121_1152x599.png 424w, https://substackcdn.com/image/fetch/$s_!3N2q!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F19296dfb-7802-4278-88d3-8684647d3121_1152x599.png 848w, https://substackcdn.com/image/fetch/$s_!3N2q!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F19296dfb-7802-4278-88d3-8684647d3121_1152x599.png 1272w, https://substackcdn.com/image/fetch/$s_!3N2q!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F19296dfb-7802-4278-88d3-8684647d3121_1152x599.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This is a <a href="https://search.library.smu.edu.sg/discovery/openurl?institution=65SMU_INST&amp;vid=65SMU_INST:SMU_NUI&amp;ctx_ver=Z39.88-2004&amp;rft.genre=article&amp;ctx_enc=info:ofi%2Fenc:UTF-8&amp;url_ver=Z39.88-2004&amp;url_ctx_fmt=infofi%2Ffmt:kev:mtx:ctx&amp;rfr_id=info:sid%2Fprimo.exlibrisgroup.com:primo4-article-cLinker&amp;rft_val_fmt=info:ofi%2Ffmt:kev:mtx:article&amp;isCitationLinker=Y&amp;lang=en&amp;rft.date=2022&amp;rft.atitle=Education%20governance%20and%20datafication&amp;rft.jtitle=Education%20and%20Science&amp;rft.volume=27&amp;rft.issue=&amp;rft.spage=3515&amp;rft.epage=3531&amp;rft.issn=&amp;rft.doi=&amp;rft.pmid=&amp;rft.aulast=&amp;rft.aufirst=&amp;rft.auinit=&amp;rft.publisher=&amp;rft.pubdate=">sample record produced in my institution&#8217;s catalogue generated by a ghost reference on a platform that has link 
resolver links </a></p></blockquote><p>This vulnerability existed long before GenAI. The 2019 citations to our example ghost reference prove that. What GenAI changes is the rate at which new ghost references can be generated and how quickly they can propagate across the web, making citation verification increasingly difficult.</p><h1>Are Academic RAG Tools Safe from This Problem?</h1><p>Given the problems with general web search, this is precisely why we turn to academic RAG and Deep Research tools like Elicit, Consensus, and Undermind. They don&#8217;t retrieve over the open web but instead query curated sources like Semantic Scholar and OpenAlex. </p><p><a href="https://aarontay.substack.com/p/mcp-servers-and-academic-search-the">Similarly, LLMs with MCP connectors to trusted content sources like PubMed or Wiley</a> avoid web pollution by querying authoritative databases directly.</p><p>But are these tools immune to the ghost reference problem?</p><p>Most AI search startups without their own data sources rely on Semantic Scholar, OpenAlex, or some combination of web scraping and partnerships. While more inclusive than Scopus, we can be reasonably assured that works in these indexes are &#8220;real&#8221; in some sense. OpenAlex (prior to the <a href="https://docs.google.com/document/d/1SPZ7QFcPddCHYt1pZP1UCIuqbfBY22lSHwgPA8RQyUY/edit?tab=t.0">Walden update</a>) only indexed works it could match with Crossref records.</p><p>Important caveats apply: <em>existence says nothing about quality</em>. A work could exist as a PDF, on a preprint server, even have a DOI, and yet still be a paper that is entirely AI-generated&#8212;potentially including references to papers that don&#8217;t exist. But at least the indexed work in OpenAlex itself does &#8220;exist&#8221;.</p><p>The critical architectural difference is how these indexes handle unmatched references. 
Unlike Google Scholar, OpenAlex and Semantic Scholar appear to only display references that can be matched against indexed works (with an OpenAlex ID or equivalent).</p><blockquote><p>Two of the most popular commercial citation indexes&#8212;Scopus and Web of Science&#8212;actually allow searching of unmatched reference strings via the somewhat obscure &#8220;<a href="https://support.clarivate.com/ScientificandAcademicResearch/s/article/Web-of-Science-Using-the-Cited-Reference-Search-to-find-articles-that-cite-the-same-two-references?language=en_US">Cited Reference Search</a>&#8221; and &#8220;<a href="https://service.elsevier.com/app/answers/detail/a_id/11423/supporthub/scopus/#panel14">Secondary documents</a>&#8221; features respectively. Does OpenAlex or Semantic Scholar have something similar?</p></blockquote><p><strong>They do not create [Citation] records for unmatched references.</strong></p><p>This is an important safeguard. </p><p>Leaving aside LLM web search finding such records, as more tools such as Undermind.ai, Consensus Deep Search, implement citation-chaining in Deep Search functionality, this design choice prevents them from surfacing and amplifying fabricated references that exist only as the equalvant of [citation] stubs.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!AGQZ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a724003-1bb4-4639-b7ac-7227a5cc3584_751x823.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!AGQZ!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a724003-1bb4-4639-b7ac-7227a5cc3584_751x823.png 424w, 
https://substackcdn.com/image/fetch/$s_!AGQZ!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a724003-1bb4-4639-b7ac-7227a5cc3584_751x823.png 848w, https://substackcdn.com/image/fetch/$s_!AGQZ!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a724003-1bb4-4639-b7ac-7227a5cc3584_751x823.png 1272w, https://substackcdn.com/image/fetch/$s_!AGQZ!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a724003-1bb4-4639-b7ac-7227a5cc3584_751x823.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!AGQZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a724003-1bb4-4639-b7ac-7227a5cc3584_751x823.png" width="751" height="823" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/7a724003-1bb4-4639-b7ac-7227a5cc3584_751x823.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:823,&quot;width&quot;:751,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:64788,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/182180407?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a724003-1bb4-4639-b7ac-7227a5cc3584_751x823.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!AGQZ!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a724003-1bb4-4639-b7ac-7227a5cc3584_751x823.png 424w, 
https://substackcdn.com/image/fetch/$s_!AGQZ!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a724003-1bb4-4639-b7ac-7227a5cc3584_751x823.png 848w, https://substackcdn.com/image/fetch/$s_!AGQZ!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a724003-1bb4-4639-b7ac-7227a5cc3584_751x823.png 1272w, https://substackcdn.com/image/fetch/$s_!AGQZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7a724003-1bb4-4639-b7ac-7227a5cc3584_751x823.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h3>The Loose Matching Problem</h3><p>A warning remains: while these indexes won&#8217;t create new records for ghost references, their matching algorithms may incorrectly link ghost references to existing real works if the algorithms are too permissive. </p><p>Consider a ghost reference generated by an LLM or a human with slightly garbled metadata. An overly loose matching algorithm might incorrectly link it to a real paper with a similar title or author. The ghost reference doesn&#8217;t create a new stub&#8212;instead, it incorrectly inflates the citation count of an existing work and creates a false trail that future researchers might follow.</p><p>The ghost reference that started this investigation had 43 citations, likely from a combination of </p><ul><li><p>humans finding the Google Scholar [Citation] record and citing it </p></li><li><p>humans copying references from papers containing the ghost reference</p></li><li><p>LLMs finding &#8220;evidence&#8221; of such records on webpages and citing it </p></li><li><p>LLMs hallucinating (in the traditional sense) variant forms of the ghost reference and being linked through loose matching algorithms.</p></li><li><p>It has been suggested that these human errors might be in the pretraining data of LLMs, leading them to generate such ghost references. I don&#8217;t think this is likely: such errors appear in a tiny fraction of training data&#8212;far too infrequent to reliably influence generation.</p></li></ul><p>I haven&#8217;t seen empirical work directly testing this hypothesis. 
It would be interesting to check whether known historical ghost references appear at elevated rates in LLM outputs compared to base rates in the literature.</p><h2>The Missing Layer: Editorial and Peer Review Responsibility</h2><p>The infrastructural focus of this analysis is important, but we shouldn&#8217;t neglect the human gatekeeping failures that allow ghost references to propagate.</p><p>Reference verification should be part of editorial and peer review processes. In practice, it rarely is. Reviewers focus on methodology, argumentation, and contribution&#8212;not on whether every cited work actually exists. Copy editors check formatting consistency, not ontological validity.</p><p>This is understandable given time constraints, but it means that the scholarly communication system lacks a verification layer at the point where it might be most effective. By the time a ghost reference appears in a published paper, it has already gained legitimacy.</p><p>Some journals have begun using automated reference checking tools, but these typically verify formatting and DOI resolution rather than performing comprehensive existence checks. A reference to a non-existent paper without a DOI would sail through.</p><p>As ghost references potentially become more common, publishers and editors may need to invest in more robust verification infrastructure&#8212;or accept that the scholarly record will become increasingly polluted.</p><p></p><h2>Conclusion: A Pre-Existing Condition, Now Acute</h2><p>The persistence of ghost references in 2025 may not just be a story about LLMs randomly hallucinating ghost references for no reason. </p><p>Academic RAG systems that retrieve from curated databases and use proper citation verification have largely solved this problem at the technical level.</p><p>The real story is older and more uncomfortable. 
Ghost references have always existed, created and propagated by human sloppiness: typos, careless copying, citing without reading, conflating similar papers. The scholarly communication infrastructure&#8212;particularly Google Scholar&#8217;s [Citation] mechanism&#8212;has long had structural vulnerabilities that allow these fabrications to persist and accumulate apparent legitimacy.</p><p>What GenAI changes is the scale and the difficulty of detection. LLMs can generate ghost references faster than humans ever could. And when we try to verify references using LLMs with web search, those tools are fooled by the pre-existing pollution that humans created over decades. The contamination feeds on itself.</p><p>This has several practical implications:</p><p><strong>For researchers: </strong>Treat Google Scholar [Citation] records with heightened suspicion&#8212;but recognise this was always good practice, not just a GenAI-era precaution. If you cannot access the full text of a work, verify its existence through multiple authoritative sources before citing it. The existence of a Google Scholar entry&#8212;even one with many citations, even one that predates ChatGPT&#8212;does not guarantee that a work is real.</p><p><strong>For librarians: </strong>When teaching information literacy, the traditional lesson was to prefer Google Scholar over general web search because it indexes &#8220;scholarly&#8221; content. This guidance needs to be updated with education about what [Citation] records are and how to handle them.</p><p><strong>For tool and citation index developers: </strong>The choice not to create placeholder records for unmatched references (or at least not make them easily discoverable)&#8212;as OpenAlex and Semantic Scholar have made&#8212;is a design decision with significant implications for research integrity. As citation-chaining becomes more common in AI search tools, this architectural choice becomes increasingly important. 
</p><p><em>Even though you can filter such records out in Google Scholar, they might consider whether [Citation] records need additional friction, warnings, or provenance indicators.</em></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!xS65!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd19fdebc-4ca7-4ae3-a31f-3a87da54de45_393x385.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!xS65!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd19fdebc-4ca7-4ae3-a31f-3a87da54de45_393x385.png 424w, https://substackcdn.com/image/fetch/$s_!xS65!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd19fdebc-4ca7-4ae3-a31f-3a87da54de45_393x385.png 848w, https://substackcdn.com/image/fetch/$s_!xS65!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd19fdebc-4ca7-4ae3-a31f-3a87da54de45_393x385.png 1272w, https://substackcdn.com/image/fetch/$s_!xS65!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd19fdebc-4ca7-4ae3-a31f-3a87da54de45_393x385.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!xS65!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd19fdebc-4ca7-4ae3-a31f-3a87da54de45_393x385.png" width="393" height="385" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/d19fdebc-4ca7-4ae3-a31f-3a87da54de45_393x385.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:385,&quot;width&quot;:393,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:12507,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/182180407?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd19fdebc-4ca7-4ae3-a31f-3a87da54de45_393x385.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!xS65!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd19fdebc-4ca7-4ae3-a31f-3a87da54de45_393x385.png 424w, https://substackcdn.com/image/fetch/$s_!xS65!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd19fdebc-4ca7-4ae3-a31f-3a87da54de45_393x385.png 848w, https://substackcdn.com/image/fetch/$s_!xS65!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd19fdebc-4ca7-4ae3-a31f-3a87da54de45_393x385.png 1272w, https://substackcdn.com/image/fetch/$s_!xS65!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd19fdebc-4ca7-4ae3-a31f-3a87da54de45_393x385.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><strong>For researchers studying scholarly communication: </strong>We need better empirical data on this phenomenon. How has the rate of ghost reference creation changed post-2023? How do different citation indexes handle unmatched references, and what are the downstream effects? How do ghost references propagate through citation networks, and can we detect them algorithmically? The pre-GenAI literature on citation errors and &#8220;academic urban legends&#8221; provides a foundation, but the landscape may have shifted significantly.</p><p>The ghost reference problem is a chronic condition that has become acute. The infection predates GenAI; the technology has simply lowered our immune response while accelerating transmission. 
The cure lies not in blaming LLMs but in understanding&#8212;and shoring up&#8212;the structural vulnerabilities in scholarly infrastructure that have allowed ghost references to propagate for far longer than we&#8217;d like to admit.</p>]]></content:encoded></item><item><title><![CDATA[Deep Research, Shallow Agency: What Academic Deep Research Can and Can't Do]]></title><description><![CDATA[The Agentic Illusion: Most Academic Deep Research tools run fixed workflows and stumble when given unfamiliar literature review tasks that do not fit them.]]></description><link>https://aarontay.substack.com/p/how-agentic-are-academic-deep-research</link><guid isPermaLink="false">https://aarontay.substack.com/p/how-agentic-are-academic-deep-research</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Mon, 08 Dec 2025 18:33:33 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!rdcp!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F50216806-ad06-4152-b637-85af53f8e5ad_1024x559.jpeg" length="0" type="image/jpeg"/><content:encoded><![CDATA[<p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me Coffee! (via ko-fi)&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me Coffee! (via ko-fi)</span></a></p><h2>Introduction</h2><p>When AI academic search tools promise &#8220;research agents&#8221; and &#8220;AI assistants,&#8221; do we know exactly what they are offering? What types of literature review tasks do these &#8220;agents&#8221; and &#8220;assistants&#8221; support? Are they able to reason flexibly and use the tools at their disposal to accomplish tasks like human research assistants? 
</p><p>I ran a simple test&#8212;asking tools to find papers that <em>should</em> have been cited by a given article but weren&#8217;t&#8212;and discovered something revealing: most fail completely.  </p><p>Why do &#8220;agents&#8221; or &#8220;Research Assistants&#8221; fail such a simple task?  </p><p>In short, we find that while today&#8217;s Academic Deep Re/search tools are impressive&#8212;they are mostly <strong>workflow-bound</strong>, not fully autonomous agents. They are closer to systems that execute pre-built scripts with AI decision points&#8212;not use human-level reasoning to flexibly achieve the goal.</p><p>So yes, these are agents in a technical sense. But calling them &#8220;research assistants&#8221; or &#8220;agentic&#8221; systems risks misrepresenting their limitations&#8212;especially for novel or off-template tasks not covered by the default workflows.</p><h2>The Definition Problem</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!ga1K!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb646c7f0-8461-496d-bad4-8e75e15c016e_1749x1093.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!ga1K!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb646c7f0-8461-496d-bad4-8e75e15c016e_1749x1093.png 424w, https://substackcdn.com/image/fetch/$s_!ga1K!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb646c7f0-8461-496d-bad4-8e75e15c016e_1749x1093.png 848w, 
https://substackcdn.com/image/fetch/$s_!ga1K!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb646c7f0-8461-496d-bad4-8e75e15c016e_1749x1093.png 1272w, https://substackcdn.com/image/fetch/$s_!ga1K!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb646c7f0-8461-496d-bad4-8e75e15c016e_1749x1093.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!ga1K!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb646c7f0-8461-496d-bad4-8e75e15c016e_1749x1093.png" width="1456" height="910" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/b646c7f0-8461-496d-bad4-8e75e15c016e_1749x1093.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:910,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:231388,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb646c7f0-8461-496d-bad4-8e75e15c016e_1749x1093.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!ga1K!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb646c7f0-8461-496d-bad4-8e75e15c016e_1749x1093.png 424w, 
https://substackcdn.com/image/fetch/$s_!ga1K!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb646c7f0-8461-496d-bad4-8e75e15c016e_1749x1093.png 848w, https://substackcdn.com/image/fetch/$s_!ga1K!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb646c7f0-8461-496d-bad4-8e75e15c016e_1749x1093.png 1272w, https://substackcdn.com/image/fetch/$s_!ga1K!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb646c7f0-8461-496d-bad4-8e75e15c016e_1749x1093.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" 
y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>We now have <a href="https://aarontay.substack.com/p/why-i-think-academic-deep-research">four distinct quadrants of AI search tools</a>:</p><p><strong>Quick Search</strong>: Conventional single-shot search (lexical, semantic, or hybrid) showing ranked results. Examples: most traditional databases, Scopus, Google Scholar.</p><p><strong>Quick RAG:</strong> Single-shot retrieval plus short generated answer. Examples:  <a href="https://knowledge.exlibrisgroup.com/Primo/Product_Materials/001_Next_Discovery_Experience_(NDE)/Primo_Research_Assistant">Primo Research Assistant</a>, <a href="https://scite.ai/assistant">Scite Assistant (to some degree)</a>.</p><p><strong>Deep Search</strong>: Iterative retrieval taking minutes, with LLM relevance ranking, returning ranked results. Examples: <a href="https://asta.allen.ai/chat">AI2 Paperfinder (now Asta)</a>, <a href="https://scholar.google.com/scholar_labs/search?hl=en">Scholar Labs.</a></p><p><strong>Deep Research</strong>: Deep Search plus report generation. Examples: <a href="https://www.undermind.ai/">Undermind</a>, <a href="https://elicit.com/">Elicit Reports</a>, <a href="https://consensus.app/">Consensus Deep Search</a>.</p><p>But where does &#8220;agentic search&#8221; or agents that search fit? I&#8217;ve been implying that Deep (Re)search is synonymous with agentic search. Is this actually true?</p><p>While the <a href="https://gist.github.com/simonw/beaa5f90133b30724c5cc1c4008d0654#response">definition of &#8220;agent&#8221; has been hotly debated in the AI industry</a>, 
<a href="https://simonwillison.net/2025/Sep/18/agents/">one technical definition gaining traction</a> is simply to say</p><blockquote><p>An LLM agent runs tools in a loop to achieve a goal.</p></blockquote><p>or as <a href="https://www.anthropic.com/engineering/effective-context-engineering-for-ai-agents">defined by Anthropic</a> - agents are </p><blockquote><p>LLMs autonomously using tools in a loop</p></blockquote><p>By the &#8220;LLM using tools in a loop&#8221; definition, virtually all Deep Search and Deep Research tools ARE agents&#8212;they use LLMs to make decisions, call tools (search APIs, citation networks), evaluate results, and iterate. AI2 Paperfinder, Elicit, Consensus Deep Search, Undermind&#8212;all qualify.</p><p>Case closed? Not quite.</p><h2>Autonomy or Agentic Behavior is a spectrum</h2><p>Anthropic defines agents as LLMs <em>autonomously</em> using tools in a loop but there are different degrees of autonomy or agency that could be given to the LLMs.</p><p>Imagine at one end of the spectrum we have </p><p><strong>100% Handcrafted systems : </strong>These systems follow predetermined workflows. The LLM makes decisions at specific points, but the workflow structure is fixed by human designers. Think of it as a decision tree: sophisticated, yes, but anticipated in advance.</p><p>At the other end we have </p><p><strong>100% Flexible systems:</strong> These systems reason from scratch about how to accomplish a task. Given a novel request, they devise an approach dynamically, combining available tools as needed to try to accomplish the goal.</p><p>Indeed one early analysis of <a href="https://leehanchung.github.io/blogs/2025/02/26/deep-research/">Deep Research tools</a> proposed this very distinction. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!2PSH!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7da757b8-8095-44a8-b791-884cb538fea1_1600x900.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!2PSH!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7da757b8-8095-44a8-b791-884cb538fea1_1600x900.png 424w, https://substackcdn.com/image/fetch/$s_!2PSH!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7da757b8-8095-44a8-b791-884cb538fea1_1600x900.png 848w, https://substackcdn.com/image/fetch/$s_!2PSH!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7da757b8-8095-44a8-b791-884cb538fea1_1600x900.png 1272w, https://substackcdn.com/image/fetch/$s_!2PSH!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7da757b8-8095-44a8-b791-884cb538fea1_1600x900.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!2PSH!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7da757b8-8095-44a8-b791-884cb538fea1_1600x900.png" width="1456" height="819" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/7da757b8-8095-44a8-b791-884cb538fea1_1600x900.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:819,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;alt 
text&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="alt text" title="alt text" srcset="https://substackcdn.com/image/fetch/$s_!2PSH!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7da757b8-8095-44a8-b791-884cb538fea1_1600x900.png 424w, https://substackcdn.com/image/fetch/$s_!2PSH!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7da757b8-8095-44a8-b791-884cb538fea1_1600x900.png 848w, https://substackcdn.com/image/fetch/$s_!2PSH!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7da757b8-8095-44a8-b791-884cb538fea1_1600x900.png 1272w, https://substackcdn.com/image/fetch/$s_!2PSH!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7da757b8-8095-44a8-b791-884cb538fea1_1600x900.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 
11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>A clear example of a handcrafted system is <a href="https://allenai.org/blog/paper-finder">Allen Institute for AI&#8217;s PaperFinder</a>. It makes this explicit when describing its <a href="https://allenai.org/blog/paper-finder">Paperfinder architecture as a &#8220;semi-rigid flow: a predefined structure that is influenced at key points by various LLM decisions.&#8221;</a> They acknowledge: &#8220;Of course, it would be cool if the LLM component were more dynamic and allowed more autonomy in how it influences the flow.&#8221;</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! 
Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p>In comparison, tools like <strong>OpenAI Deep Research</strong> sit much closer to the <em>trained / autonomous</em> end of the spectrum than most academic &#8220;Deep Search&#8221; products.</p><p>Where a workflow-based tool like AI2 Paperfinder follows a predefined sequence (query analyser &#8594; router &#8594; sub-flow A/B/C, etc.), Deep Research behaves more like a <strong>general-purpose research agent</strong>:</p><ul><li><p>It starts from a natural language prompt:</p></li></ul><blockquote><p>&#8220;Write a detailed literature review on X, highlighting key debates and gaps.&#8221;</p></blockquote><ul><li><p>It <strong>plans</strong> its own work: decomposes the task into subtasks (e.g., &#8220;define scope&#8221;, &#8220;gather sources&#8221;, &#8220;cluster perspectives&#8221;, &#8220;draft sections&#8221;).</p></li><li><p>It <strong>chooses tools dynamically</strong>: web search, citation lookups, summarisation, comparison, checking contradictions, etc.</p></li><li><p>It <strong>adjusts the plan on the fly</strong> if it hits coverage gaps, conflicting evidence, or poor sources.</p></li><li><p>Unlike LLMs that have fixed workflows, the same prompt can be handled very differently (e.g. might use a different set of tools) due to the non-deterministic nature of LLMs </p></li></ul><blockquote><p>These types of systems tend to be trained with reinforcement learning  </p></blockquote><p><em>This spectrum of agency or autonomy captures something crucial</em>. 
Most current academic Deep Search and Deep Research tools sit firmly on the handcrafted end: sophisticated workflows, yes, but workflows that human designers anticipated in advance. The LLM&#8217;s role is to make intelligent choices within the workflow&#8212;not to design the workflow itself.</p><p><em>Which means such tools will almost certainly fail when asked to do tasks that don&#8217;t fit neatly into those predetermined workflows</em>. Worse, they may still return results&#8212;it may not even be obvious that the system has failed until you examine the output carefully.</p><blockquote><p>Of course, one could argue <strong>The &#8220;LLM + tools in loop&#8221; definition is too permissive a definition for agents or agentic behavior.</strong> Perhaps tools like AI2 Paperfinder are &#8220;agentic systems/frameworks&#8221; to<em> automate </em>certain tasks as opposed to being actual agents with agentic behavior. But there is no right definition!</p><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!laBL!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87ce4236-e8eb-4e24-8fab-3bf10084c16b_741x147.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!laBL!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87ce4236-e8eb-4e24-8fab-3bf10084c16b_741x147.png 424w, https://substackcdn.com/image/fetch/$s_!laBL!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87ce4236-e8eb-4e24-8fab-3bf10084c16b_741x147.png 848w, 
https://substackcdn.com/image/fetch/$s_!laBL!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87ce4236-e8eb-4e24-8fab-3bf10084c16b_741x147.png 1272w, https://substackcdn.com/image/fetch/$s_!laBL!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87ce4236-e8eb-4e24-8fab-3bf10084c16b_741x147.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!laBL!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87ce4236-e8eb-4e24-8fab-3bf10084c16b_741x147.png" width="741" height="147" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/87ce4236-e8eb-4e24-8fab-3bf10084c16b_741x147.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:147,&quot;width&quot;:741,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:14342,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87ce4236-e8eb-4e24-8fab-3bf10084c16b_741x147.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!laBL!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87ce4236-e8eb-4e24-8fab-3bf10084c16b_741x147.png 424w, https://substackcdn.com/image/fetch/$s_!laBL!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87ce4236-e8eb-4e24-8fab-3bf10084c16b_741x147.png 848w, 
https://substackcdn.com/image/fetch/$s_!laBL!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87ce4236-e8eb-4e24-8fab-3bf10084c16b_741x147.png 1272w, https://substackcdn.com/image/fetch/$s_!laBL!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F87ce4236-e8eb-4e24-8fab-3bf10084c16b_741x147.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p></p></blockquote><p></p><h2>Does the &#8220;agentic&#8221; or &#8220;research assistant&#8221; framing lead to misunderstandings?</h2><p>Many of these AI literature review or AI powered tools have adopted marketing language, <em>that may suggest advanced autonomous capabilities</em>&#8212; by either talking about &#8220;research agents&#8221; if not about &#8220;research assistants&#8221;.</p><blockquote><p>I am not pointing fingers at particular players, pretty much all of them do similar marketing.</p></blockquote><p>Consider these framings:</p><p><a href="https://help.consensus.app/en/articles/12641232-scholar-agent">Consensus</a></p><blockquote><p>Scholar Agent is your personal research assistant in Consensus, built into Pro and Deep search modes. It goes beyond quick summaries by performing multi-step searches, applying rigorous academic filters, and surfacing deeper insights, trends, and key papers-fast.</p></blockquote><p>Undermind.ai is more restrained on their homepage but you <a href="https://allenai.org/blog/paper-finder">see on their Y Combinator tagline they also invoke the &#8220;agent&#8221; idea</a></p><blockquote><p>An AI agent for scientific research</p></blockquote><p>Meanwhile, pretty much every tool even if it avoids the &#8220;Agentic&#8221; language - positions their tool as a &#8220;research assistant&#8221; (e.g. 
Elicit.com, Clarivate products).</p><p>This language&#8212;&#8220;research assistant,&#8221; &#8220;agent,&#8221; &#8220;multi-step reasoning&#8221;&#8212;implies flexibility. It suggests that given any literature review task, these systems can devise an approach, just as a human research assistant would.</p><p>But if the underlying architecture is handcrafted workflows, users will inevitably encounter tasks that fall outside those workflows&#8212;and be surprised when the system fails.</p><h2>How autonomous or flexible is your agent?</h2><p>Any AI search tool can find papers on a topic fitting some criteria. But can they handle this simple task?  </p><p><code>Find me papers that could/should have been cited by Paper X but were not.</code></p><p>A human research assistant would immediately devise a plan:</p><ol><li><p>Find papers on the same topic as X, filtered by publication year</p></li><li><p>Extract the references from Paper X</p></li><li><p>Report papers found in step 1 that don&#8217;t appear in step 2</p></li></ol><p>This requires no specialized knowledge&#8212;just the ability to reason about task structure and combine tools appropriately (well within reach of the reasoning capabilities of modern LLMs). I also chose this task because many academic Deep Research tools, such as Undermind.ai and Consensus Deep Search, claim the ability to do citation searching.</p><p>It&#8217;s precisely the kind of task that reveals whether a system has flexible reasoning or merely executes handcrafted workflows.</p><p>We might expect these LLM &#8220;agents&#8221; or &#8220;research assistants&#8221;, when given a task, to reason from scratch and &#8220;decide&#8221; what to do with the tools they have.  
Systems with fixed workflows will probably fail, unless the designers had anticipated such tasks and created a workflow in advance for this (unlikely).</p><p>I tested this using an open access paper: &#8220;<a href="https://peerj.com/articles/4375/">The state of OA: a large-scale analysis of the prevalence and impact of Open Access articles</a>.&#8221; My prompt:</p><p><code>find the paper &#8220;The state of OA: a large-scale analysis of the prevalence and impact of Open Access articles.&#8221; Then, identify papers that are related to this paper that could have been cited but are not cited by it</code></p><p>The paper is open access, so failure wouldn&#8217;t result from access restrictions. It has a relatively comprehensive bibliography, so randomly suggesting papers wouldn&#8217;t work.</p><p>For the system to succeed, it needs to have the capability to access the paper, extract its references, find related papers, and compare and filter. </p><p>Most importantly, it needs either a predefined workflow for this specific task (unlikely) or the ability to reason flexibly about combining available tools.</p><p>See Appendix for more details on the tests.</p><h2>The Results</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!tRYC!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ce8a5ad-92a2-4ca7-ab10-9d120873f85c_877x516.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!tRYC!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ce8a5ad-92a2-4ca7-ab10-9d120873f85c_877x516.png 424w, 
https://substackcdn.com/image/fetch/$s_!tRYC!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ce8a5ad-92a2-4ca7-ab10-9d120873f85c_877x516.png 848w, https://substackcdn.com/image/fetch/$s_!tRYC!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ce8a5ad-92a2-4ca7-ab10-9d120873f85c_877x516.png 1272w, https://substackcdn.com/image/fetch/$s_!tRYC!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ce8a5ad-92a2-4ca7-ab10-9d120873f85c_877x516.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!tRYC!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ce8a5ad-92a2-4ca7-ab10-9d120873f85c_877x516.png" width="877" height="516" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/5ce8a5ad-92a2-4ca7-ab10-9d120873f85c_877x516.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:516,&quot;width&quot;:877,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:29625,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ce8a5ad-92a2-4ca7-ab10-9d120873f85c_877x516.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!tRYC!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ce8a5ad-92a2-4ca7-ab10-9d120873f85c_877x516.png 424w, 
https://substackcdn.com/image/fetch/$s_!tRYC!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ce8a5ad-92a2-4ca7-ab10-9d120873f85c_877x516.png 848w, https://substackcdn.com/image/fetch/$s_!tRYC!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ce8a5ad-92a2-4ca7-ab10-9d120873f85c_877x516.png 1272w, https://substackcdn.com/image/fetch/$s_!tRYC!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5ce8a5ad-92a2-4ca7-ab10-9d120873f85c_877x516.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>General-purpose LLMs succeeded. Claude Sonnet&#8212;<a href="https://claude.ai/share/89dbcc1b-61e0-4b0b-b24c-e31538420552">even the free version with default web search</a> without <a href="https://aarontay.substack.com/p/mcp-servers-and-academic-search-the">specialised MCP connectors to gain access to academic or even paywalled content like Wiley AI Gateway or Pubmed</a> &#8212;reasoned through the task structure, identified the paper, extracted references, found related work, and filtered appropriately. </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!bn2q!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb21db52-b3c3-4946-850f-304ea67492a7_863x698.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!bn2q!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb21db52-b3c3-4946-850f-304ea67492a7_863x698.png 424w, https://substackcdn.com/image/fetch/$s_!bn2q!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb21db52-b3c3-4946-850f-304ea67492a7_863x698.png 848w, https://substackcdn.com/image/fetch/$s_!bn2q!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb21db52-b3c3-4946-850f-304ea67492a7_863x698.png 1272w, https://substackcdn.com/image/fetch/$s_!bn2q!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb21db52-b3c3-4946-850f-304ea67492a7_863x698.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!bn2q!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb21db52-b3c3-4946-850f-304ea67492a7_863x698.png" width="863" height="698" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/db21db52-b3c3-4946-850f-304ea67492a7_863x698.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:698,&quot;width&quot;:863,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:93979,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb21db52-b3c3-4946-850f-304ea67492a7_863x698.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!bn2q!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb21db52-b3c3-4946-850f-304ea67492a7_863x698.png 424w, https://substackcdn.com/image/fetch/$s_!bn2q!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb21db52-b3c3-4946-850f-304ea67492a7_863x698.png 848w, https://substackcdn.com/image/fetch/$s_!bn2q!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb21db52-b3c3-4946-850f-304ea67492a7_863x698.png 1272w, https://substackcdn.com/image/fetch/$s_!bn2q!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb21db52-b3c3-4946-850f-304ea67492a7_863x698.png 1456w" sizes="100vw" 
loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Some suggestions were only tangentially related (the obvious ones were already cited), but it clearly understood and executed the task logic. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!9zBG!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab71c1a1-7fc0-42fd-a524-02ecaada9bc0_747x747.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!9zBG!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab71c1a1-7fc0-42fd-a524-02ecaada9bc0_747x747.png 424w, https://substackcdn.com/image/fetch/$s_!9zBG!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab71c1a1-7fc0-42fd-a524-02ecaada9bc0_747x747.png 848w, https://substackcdn.com/image/fetch/$s_!9zBG!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab71c1a1-7fc0-42fd-a524-02ecaada9bc0_747x747.png 1272w, https://substackcdn.com/image/fetch/$s_!9zBG!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab71c1a1-7fc0-42fd-a524-02ecaada9bc0_747x747.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!9zBG!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab71c1a1-7fc0-42fd-a524-02ecaada9bc0_747x747.png" width="747" height="747" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ab71c1a1-7fc0-42fd-a524-02ecaada9bc0_747x747.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:747,&quot;width&quot;:747,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:137665,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab71c1a1-7fc0-42fd-a524-02ecaada9bc0_747x747.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!9zBG!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab71c1a1-7fc0-42fd-a524-02ecaada9bc0_747x747.png 424w, https://substackcdn.com/image/fetch/$s_!9zBG!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab71c1a1-7fc0-42fd-a524-02ecaada9bc0_747x747.png 848w, https://substackcdn.com/image/fetch/$s_!9zBG!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab71c1a1-7fc0-42fd-a524-02ecaada9bc0_747x747.png 1272w, https://substackcdn.com/image/fetch/$s_!9zBG!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab71c1a1-7fc0-42fd-a524-02ecaada9bc0_747x747.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><strong>GPT models</strong> similarly succeeded when I tested them months ago. </p><p><strong>Gemini</strong> and <strong>GPT-5.1</strong> currently struggle, but primarily due to access issues (they claim to be blocked from full-text). Uploading the PDF directly works.</p><blockquote><p>Notably, I used these LLMs in standard mode, not Deep Research mode. 
Deep Research modes should work as well unless they trigger predetermined workflows rather than flexible reasoning.</p></blockquote><p>In conclusion, almost all top general-purpose LLMs sit on the trained/flexible end of the spectrum: they reason from scratch about each prompt and devise approaches dynamically.</p><h3>Most Specialized Academic Deep Search/Research Tools Fail</h3><p><a href="https://asta.allen.ai/share/31671682-5133-4798-b0e6-c11d81fad90c">AI2 Paperfinder</a> has a pretty <a href="https://allenai.org/blog/paper-finder">transparent workflow in their blog post</a>, so I asked Gemini 3 to extract the workflow and generate a flow diagram using Nano Banana Pro and this was the result.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!QIS9!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffd2f4c-41a2-492b-bff1-beafcba74bcc_1055x1491.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!QIS9!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffd2f4c-41a2-492b-bff1-beafcba74bcc_1055x1491.png 424w, https://substackcdn.com/image/fetch/$s_!QIS9!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffd2f4c-41a2-492b-bff1-beafcba74bcc_1055x1491.png 848w, https://substackcdn.com/image/fetch/$s_!QIS9!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffd2f4c-41a2-492b-bff1-beafcba74bcc_1055x1491.png 1272w, 
https://substackcdn.com/image/fetch/$s_!QIS9!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffd2f4c-41a2-492b-bff1-beafcba74bcc_1055x1491.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!QIS9!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffd2f4c-41a2-492b-bff1-beafcba74bcc_1055x1491.png" width="1055" height="1491" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/6ffd2f4c-41a2-492b-bff1-beafcba74bcc_1055x1491.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1491,&quot;width&quot;:1055,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1621306,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffd2f4c-41a2-492b-bff1-beafcba74bcc_1055x1491.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!QIS9!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffd2f4c-41a2-492b-bff1-beafcba74bcc_1055x1491.png 424w, https://substackcdn.com/image/fetch/$s_!QIS9!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffd2f4c-41a2-492b-bff1-beafcba74bcc_1055x1491.png 848w, 
https://substackcdn.com/image/fetch/$s_!QIS9!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffd2f4c-41a2-492b-bff1-beafcba74bcc_1055x1491.png 1272w, https://substackcdn.com/image/fetch/$s_!QIS9!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffd2f4c-41a2-492b-bff1-beafcba74bcc_1055x1491.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>[Update April 2026] I updated the image using the details mentioned in a more recent <a href="https://arxiv.org/pdf/2510.21652">2026 
paper appendix F3 </a>that describes the inner workings of a &#8220;frozen-in-time subset of the PaperFinder subcomponent of the Asta project (&#8220;the PaperFinder Product&#8221;)&#8221;. </p><p>While the diagram above may not be 100% correct, it gives you a big picture view of what is happening. </p><blockquote><p>This looks very complicated, but currently &#8220;<a href="https://arxiv.org/pdf/2510.21652">PaperFinder agent works as a pipeline of manual coded steps which involve LLM decisions</a>&#8221; and they found &#8220;<a href="https://arxiv.org/pdf/2510.21652">manual-coding approach to be more efficient (in terms of number of LLM calls, number of tokens, and in terms of the ability to parallelize) and more reliable than a more dynamic process that grants more autonomy to the LLM in several key-points</a>&#8221;.</p></blockquote><p>Important to note is that <a href="https://allenai.org/blog/paper-finder#:~:text=Our%20current%20implementation%20routes%20to%20one%20of%20several%20pre%2Ddefined%20sub%2Dflows%3A%20specific%20paper%20search%2C%20semantic%20search%20with%20potential%20metadata%20constraints%2C%20pure%2Dmetadata%20queries%2C%20and%20queries%20that%20involve%20an%20author%20name.">AI2 Paperfinder (now Find paper in Asta) tries to direct your input to one of several subflows including &#8220;specific paper search, semantic search with potential metadata constraints, pure-metadata queries, and queries that involve an author name.&#8221;</a> (In the above flowchart, they correspond to navigational queries, semantic queries and metadata queries.)</p><p>When given <a href="https://asta.allen.ai/share/31671682-5133-4798-b0e6-c11d81fad90c">my query</a>, it naturally treated it as a simple <a 
href="https://allenai.org/blog/paper-finder#:~:text=Our%20current%20implementation%20routes%20to%20one%20of%20several%20pre%2Ddefined%20sub%2Dflows%3A%20specific%20paper%20search%2C%20semantic%20search%20with%20potential%20metadata%20constraints%2C%20pure%2Dmetadata%20queries%2C%20and%20queries%20that%20involve%20an%20author%20name.">specific paper lookup</a> and stopped once it found the target article.  It had no capability of going further.</p><p>Consensus Deep Search <a href="https://consensus.app/search/find-the-paper-the-state-of-oa-a-large-scale-analy/AWF-M7w4QMCaFnB-9rFw-g/">also failed</a>&#8212;despite <a href="https://openai.com/index/consensus/#:~:text=Built%20on%20GPT%E2%80%915%20and%20the%20Responses%20API%2C%20the,determines%20structure%20and%20visuals%2C%20and%20composes%20the%20final%20output">using GPT5 to act as four different sub-agents (planning Agent, Search Agent, Reading Agent, Analysis Agent) </a>and returned papers that were already cited. </p><p>In the end, it was designed for a fixed and specific workflow, as you can see from the user interface where it does the same steps no matter the query.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!MkX0!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb2914feb-f935-432e-9290-17ea7cb21845_561x873.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!MkX0!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb2914feb-f935-432e-9290-17ea7cb21845_561x873.png 424w, 
https://substackcdn.com/image/fetch/$s_!MkX0!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb2914feb-f935-432e-9290-17ea7cb21845_561x873.png 848w, https://substackcdn.com/image/fetch/$s_!MkX0!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb2914feb-f935-432e-9290-17ea7cb21845_561x873.png 1272w, https://substackcdn.com/image/fetch/$s_!MkX0!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb2914feb-f935-432e-9290-17ea7cb21845_561x873.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!MkX0!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb2914feb-f935-432e-9290-17ea7cb21845_561x873.png" width="561" height="873" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/b2914feb-f935-432e-9290-17ea7cb21845_561x873.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:873,&quot;width&quot;:561,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:55206,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb2914feb-f935-432e-9290-17ea7cb21845_561x873.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!MkX0!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb2914feb-f935-432e-9290-17ea7cb21845_561x873.png 424w, 
https://substackcdn.com/image/fetch/$s_!MkX0!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb2914feb-f935-432e-9290-17ea7cb21845_561x873.png 848w, https://substackcdn.com/image/fetch/$s_!MkX0!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb2914feb-f935-432e-9290-17ea7cb21845_561x873.png 1272w, https://substackcdn.com/image/fetch/$s_!MkX0!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb2914feb-f935-432e-9290-17ea7cb21845_561x873.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>EDIT: In fact, the same query usually leads to slightly different steps and searches, but you still can&#8217;t do anything besides running a bunch of searches (with some citation searching), deduping and reranking.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!f964!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc43c859-4c34-48d6-b8d3-c825b4688dc1_561x899.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!f964!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc43c859-4c34-48d6-b8d3-c825b4688dc1_561x899.png 424w, https://substackcdn.com/image/fetch/$s_!f964!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc43c859-4c34-48d6-b8d3-c825b4688dc1_561x899.png 848w, https://substackcdn.com/image/fetch/$s_!f964!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc43c859-4c34-48d6-b8d3-c825b4688dc1_561x899.png 1272w, https://substackcdn.com/image/fetch/$s_!f964!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc43c859-4c34-48d6-b8d3-c825b4688dc1_561x899.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!f964!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc43c859-4c34-48d6-b8d3-c825b4688dc1_561x899.png" width="561" height="899" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/fc43c859-4c34-48d6-b8d3-c825b4688dc1_561x899.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:899,&quot;width&quot;:561,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:62690,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc43c859-4c34-48d6-b8d3-c825b4688dc1_561x899.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!f964!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc43c859-4c34-48d6-b8d3-c825b4688dc1_561x899.png 424w, https://substackcdn.com/image/fetch/$s_!f964!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc43c859-4c34-48d6-b8d3-c825b4688dc1_561x899.png 848w, https://substackcdn.com/image/fetch/$s_!f964!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc43c859-4c34-48d6-b8d3-c825b4688dc1_561x899.png 1272w, https://substackcdn.com/image/fetch/$s_!f964!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc43c859-4c34-48d6-b8d3-c825b4688dc1_561x899.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>You get even more visibility of what is going on by looking at the <a href="https://openai.com/index/consensus/">Agent Flow Diagram on OpenAI&#8217;s webpage!</a>  You can tell there is not much hope as it is using a pretty rigid structure.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!x55F!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc33413a6-3f6e-49a9-9d82-e787bb19783e_1868x3014.webp" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" 
srcset="https://substackcdn.com/image/fetch/$s_!x55F!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc33413a6-3f6e-49a9-9d82-e787bb19783e_1868x3014.webp 424w, https://substackcdn.com/image/fetch/$s_!x55F!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc33413a6-3f6e-49a9-9d82-e787bb19783e_1868x3014.webp 848w, https://substackcdn.com/image/fetch/$s_!x55F!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc33413a6-3f6e-49a9-9d82-e787bb19783e_1868x3014.webp 1272w, https://substackcdn.com/image/fetch/$s_!x55F!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc33413a6-3f6e-49a9-9d82-e787bb19783e_1868x3014.webp 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!x55F!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc33413a6-3f6e-49a9-9d82-e787bb19783e_1868x3014.webp" width="1456" height="2349" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c33413a6-3f6e-49a9-9d82-e787bb19783e_1868x3014.webp&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:2349,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Agent flow diagram showing how a user query is processed through planning, parallel search, reading, and analysis agents to generate a research-based output.&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Agent 
flow diagram showing how a user query is processed through planning, parallel search, reading, and analysis agents to generate a research-based output." title="Agent flow diagram showing how a user query is processed through planning, parallel search, reading, and analysis agents to generate a research-based output." srcset="https://substackcdn.com/image/fetch/$s_!x55F!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc33413a6-3f6e-49a9-9d82-e787bb19783e_1868x3014.webp 424w, https://substackcdn.com/image/fetch/$s_!x55F!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc33413a6-3f6e-49a9-9d82-e787bb19783e_1868x3014.webp 848w, https://substackcdn.com/image/fetch/$s_!x55F!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc33413a6-3f6e-49a9-9d82-e787bb19783e_1868x3014.webp 1272w, https://substackcdn.com/image/fetch/$s_!x55F!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc33413a6-3f6e-49a9-9d82-e787bb19783e_1868x3014.webp 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 
11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Undermind asked clarifying questions that seemed promising,  </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!W-UY!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbb9c9516-0733-4639-b4cb-1392789cd286_686x892.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!W-UY!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbb9c9516-0733-4639-b4cb-1392789cd286_686x892.png 424w, https://substackcdn.com/image/fetch/$s_!W-UY!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbb9c9516-0733-4639-b4cb-1392789cd286_686x892.png 848w, https://substackcdn.com/image/fetch/$s_!W-UY!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbb9c9516-0733-4639-b4cb-1392789cd286_686x892.png 1272w, 
https://substackcdn.com/image/fetch/$s_!W-UY!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbb9c9516-0733-4639-b4cb-1392789cd286_686x892.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!W-UY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbb9c9516-0733-4639-b4cb-1392789cd286_686x892.png" width="686" height="892" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/bb9c9516-0733-4639-b4cb-1392789cd286_686x892.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:892,&quot;width&quot;:686,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!W-UY!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbb9c9516-0733-4639-b4cb-1392789cd286_686x892.png 424w, https://substackcdn.com/image/fetch/$s_!W-UY!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbb9c9516-0733-4639-b4cb-1392789cd286_686x892.png 848w, https://substackcdn.com/image/fetch/$s_!W-UY!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbb9c9516-0733-4639-b4cb-1392789cd286_686x892.png 1272w, 
https://substackcdn.com/image/fetch/$s_!W-UY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbb9c9516-0733-4639-b4cb-1392789cd286_686x892.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>giving you the impression it could handle the request</p><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!wwCL!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc73bb869-c7db-411d-ab6e-d32e47d4ebdb_602x194.png" 
data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!wwCL!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc73bb869-c7db-411d-ab6e-d32e47d4ebdb_602x194.png 424w, https://substackcdn.com/image/fetch/$s_!wwCL!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc73bb869-c7db-411d-ab6e-d32e47d4ebdb_602x194.png 848w, https://substackcdn.com/image/fetch/$s_!wwCL!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc73bb869-c7db-411d-ab6e-d32e47d4ebdb_602x194.png 1272w, https://substackcdn.com/image/fetch/$s_!wwCL!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc73bb869-c7db-411d-ab6e-d32e47d4ebdb_602x194.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!wwCL!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc73bb869-c7db-411d-ab6e-d32e47d4ebdb_602x194.png" width="602" height="194" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c73bb869-c7db-411d-ab6e-d32e47d4ebdb_602x194.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:194,&quot;width&quot;:602,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!wwCL!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc73bb869-c7db-411d-ab6e-d32e47d4ebdb_602x194.png 424w, https://substackcdn.com/image/fetch/$s_!wwCL!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc73bb869-c7db-411d-ab6e-d32e47d4ebdb_602x194.png 848w, https://substackcdn.com/image/fetch/$s_!wwCL!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc73bb869-c7db-411d-ab6e-d32e47d4ebdb_602x194.png 1272w, https://substackcdn.com/image/fetch/$s_!wwCL!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc73bb869-c7db-411d-ab6e-d32e47d4ebdb_602x194.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p>It <a href="https://app.undermind.ai/report/60edd77bd62af0aee9633157eb7229d875c1d83d5e9618130561f8964f106d35">doesn&#8217;t work of course</a>, it finds many related papers but most are cited already.</p><p>Because we have the least information about Undermind&#8217;s internals, I tried other tests e.g. 
Find me papers that cite or reference paper X but are before 2015, and here the LLM that helps to clarify intent often warns you the system cannot do the task you want!</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!AuAR!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72ab6a77-c512-45bf-aab9-4669f11866f1_631x612.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!AuAR!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72ab6a77-c512-45bf-aab9-4669f11866f1_631x612.png 424w, https://substackcdn.com/image/fetch/$s_!AuAR!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72ab6a77-c512-45bf-aab9-4669f11866f1_631x612.png 848w, https://substackcdn.com/image/fetch/$s_!AuAR!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72ab6a77-c512-45bf-aab9-4669f11866f1_631x612.png 1272w, https://substackcdn.com/image/fetch/$s_!AuAR!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72ab6a77-c512-45bf-aab9-4669f11866f1_631x612.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!AuAR!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72ab6a77-c512-45bf-aab9-4669f11866f1_631x612.png" width="631" height="612" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/72ab6a77-c512-45bf-aab9-4669f11866f1_631x612.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:612,&quot;width&quot;:631,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:43920,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72ab6a77-c512-45bf-aab9-4669f11866f1_631x612.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!AuAR!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72ab6a77-c512-45bf-aab9-4669f11866f1_631x612.png 424w, https://substackcdn.com/image/fetch/$s_!AuAR!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72ab6a77-c512-45bf-aab9-4669f11866f1_631x612.png 848w, https://substackcdn.com/image/fetch/$s_!AuAR!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72ab6a77-c512-45bf-aab9-4669f11866f1_631x612.png 1272w, https://substackcdn.com/image/fetch/$s_!AuAR!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72ab6a77-c512-45bf-aab9-4669f11866f1_631x612.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>Elicit Research Reports can&#8217;t succeed because its workflow is fixed: search &#8594; generate inclusion criteria &#8594; screen &#8594; extract. There&#8217;s no step for &#8220;check if paper is already cited in source document.&#8221;</p><p>In short, all of the Academic Deep Search and Deep Research tools failed because their &#8220;agents&#8221; are all working with fixed, predefined flows and none of them had a flow predesigned for my task.</p><p></p><h2>Why Handcrafted Workflows Aren&#8217;t Bad</h2><p>While it seems like a more autonomous, more agentic system is clearly superior to one with handcrafted, pre-determined flows, it&#8217;s not as clear-cut as it looks.</p><p><strong>Speed and efficiency:</strong> Fixed workflows are dramatically faster. Undermind and Consensus Deep Search complete comprehensive searches in 8-10 minutes. 
Flexible deep research tools like OpenAI&#8217;s Deep Research and Gemini Deep Research take 20-30 minutes for comparable tasks. When you know the workflow in advance, you can parallelize operations, pre-optimize queries, and avoid reasoning overhead.</p><blockquote><p>Part of the reason why this difference is seen might also have to do with the different way these two classes of tools access data, with OpenAI/Gemini Deep Research tending to use slower more &#8220;real time&#8221; methods.</p></blockquote><p> </p><p><strong>Reliability and consistency: </strong>Fixed workflows produce predictable outputs. Flexible reasoning introduces variance&#8212;sometimes brilliantly adaptive, sometimes nonsense attempts. For researchers needing dependable results, workflow constraints make things more predictable.</p><p><strong>Cost management: </strong>Open-ended agent loops are expensive. Each LLM call costs tokens; each API call costs money and time. Predefined workflows bound resource consumption predictably. A truly flexible agent might run dozens of exploratory attempts before settling on an approach.</p><p><strong>Auditability: </strong>When Elicit or Consensus Deep Search follows a PRISMA-like workflow, researchers can evaluate methodology independently. Flexible reasoning is harder to audit&#8212;how do you assess whether an agent&#8217;s self-designed approach was appropriate?</p><p>For standard literature reviews, systematic reviews, and discovery searches, workflow-optimized tools are often the right choice. 
Why have an LLM reinvent the wheel for well-understood tasks?</p><p>My critique isn&#8217;t that predetermined fixed workflows are bad&#8212;it&#8217;s that marketing language suggesting flexible reasoning misrepresents or at least can mislead users to overestimate the capabilities of the system.</p><h2>SciSpace Agents - does this break the mold?</h2><p>Are there specialised academic search tools that work like truly flexible agents the way Claude, ChatGPT and Gemini are and can handle and reason out arbitrary literature review tasks?</p><p>If there is anyone that might be able to do it, it would be the new SciSpace Agents.</p><p><strong>SciSpace Agents</strong> (distinct from <a href="https://scispace.com/resources/open-ai-deep-research-scispace-deep-review/">SciSpace Deep Review</a>) represents an interesting architectural alternative. Rather than encoding fixed workflows, it exposes a toolkit and lets the LLM reason about using different tool combinations.</p><p>From what I can see SciSpace Agents exposes a bunch of tools that you can use to ask it to try to accomplish your tasks.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!8upo!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1fc81744-a04f-48d0-ac6e-cceb9c007061_612x1062.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!8upo!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1fc81744-a04f-48d0-ac6e-cceb9c007061_612x1062.png 424w, https://substackcdn.com/image/fetch/$s_!8upo!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1fc81744-a04f-48d0-ac6e-cceb9c007061_612x1062.png 848w, 
https://substackcdn.com/image/fetch/$s_!8upo!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1fc81744-a04f-48d0-ac6e-cceb9c007061_612x1062.png 1272w, https://substackcdn.com/image/fetch/$s_!8upo!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1fc81744-a04f-48d0-ac6e-cceb9c007061_612x1062.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!8upo!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1fc81744-a04f-48d0-ac6e-cceb9c007061_612x1062.png" width="612" height="1062" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/1fc81744-a04f-48d0-ac6e-cceb9c007061_612x1062.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1062,&quot;width&quot;:612,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:50985,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1fc81744-a04f-48d0-ac6e-cceb9c007061_612x1062.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!8upo!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1fc81744-a04f-48d0-ac6e-cceb9c007061_612x1062.png 424w, 
https://substackcdn.com/image/fetch/$s_!8upo!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1fc81744-a04f-48d0-ac6e-cceb9c007061_612x1062.png 848w, https://substackcdn.com/image/fetch/$s_!8upo!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1fc81744-a04f-48d0-ac6e-cceb9c007061_612x1062.png 1272w, https://substackcdn.com/image/fetch/$s_!8upo!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1fc81744-a04f-48d0-ac6e-cceb9c007061_612x1062.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>SciSpace Agents has an <a href="https://scispace.com/agents">Agent Gallery</a> that shows a wide variety of tasks that can be done with the tools with many relating to systematic review tasks, citation mapping, and various analytical workflows. </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!ph6E!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4a996967-03b0-45d4-bbdd-837973de9cee_1770x833.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!ph6E!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4a996967-03b0-45d4-bbdd-837973de9cee_1770x833.png 424w, https://substackcdn.com/image/fetch/$s_!ph6E!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4a996967-03b0-45d4-bbdd-837973de9cee_1770x833.png 848w, https://substackcdn.com/image/fetch/$s_!ph6E!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4a996967-03b0-45d4-bbdd-837973de9cee_1770x833.png 1272w, https://substackcdn.com/image/fetch/$s_!ph6E!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4a996967-03b0-45d4-bbdd-837973de9cee_1770x833.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!ph6E!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4a996967-03b0-45d4-bbdd-837973de9cee_1770x833.png" width="1456" height="685" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4a996967-03b0-45d4-bbdd-837973de9cee_1770x833.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:685,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:112889,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4a996967-03b0-45d4-bbdd-837973de9cee_1770x833.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!ph6E!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4a996967-03b0-45d4-bbdd-837973de9cee_1770x833.png 424w, https://substackcdn.com/image/fetch/$s_!ph6E!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4a996967-03b0-45d4-bbdd-837973de9cee_1770x833.png 848w, https://substackcdn.com/image/fetch/$s_!ph6E!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4a996967-03b0-45d4-bbdd-837973de9cee_1770x833.png 1272w, https://substackcdn.com/image/fetch/$s_!ph6E!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4a996967-03b0-45d4-bbdd-837973de9cee_1770x833.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p> </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!hlAb!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7bb32ccb-bc22-40f2-8d52-fca7913a6f6e_1505x805.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!hlAb!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7bb32ccb-bc22-40f2-8d52-fca7913a6f6e_1505x805.png 424w, 
https://substackcdn.com/image/fetch/$s_!hlAb!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7bb32ccb-bc22-40f2-8d52-fca7913a6f6e_1505x805.png 848w, https://substackcdn.com/image/fetch/$s_!hlAb!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7bb32ccb-bc22-40f2-8d52-fca7913a6f6e_1505x805.png 1272w, https://substackcdn.com/image/fetch/$s_!hlAb!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7bb32ccb-bc22-40f2-8d52-fca7913a6f6e_1505x805.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!hlAb!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7bb32ccb-bc22-40f2-8d52-fca7913a6f6e_1505x805.png" width="1456" height="779" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/7bb32ccb-bc22-40f2-8d52-fca7913a6f6e_1505x805.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:779,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:63595,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7bb32ccb-bc22-40f2-8d52-fca7913a6f6e_1505x805.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!hlAb!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7bb32ccb-bc22-40f2-8d52-fca7913a6f6e_1505x805.png 424w, https://substackcdn.com/image/fetch/$s_!hlAb!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7bb32ccb-bc22-40f2-8d52-fca7913a6f6e_1505x805.png 848w, https://substackcdn.com/image/fetch/$s_!hlAb!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7bb32ccb-bc22-40f2-8d52-fca7913a6f6e_1505x805.png 1272w, https://substackcdn.com/image/fetch/$s_!hlAb!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7bb32ccb-bc22-40f2-8d52-fca7913a6f6e_1505x805.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" 
stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Users can inspect the exact flow for each agent.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!cbr0!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F008a2804-765a-4d0c-ba8c-b07d4bd5da0a_762x785.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!cbr0!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F008a2804-765a-4d0c-ba8c-b07d4bd5da0a_762x785.png 424w, https://substackcdn.com/image/fetch/$s_!cbr0!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F008a2804-765a-4d0c-ba8c-b07d4bd5da0a_762x785.png 848w, https://substackcdn.com/image/fetch/$s_!cbr0!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F008a2804-765a-4d0c-ba8c-b07d4bd5da0a_762x785.png 1272w, https://substackcdn.com/image/fetch/$s_!cbr0!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F008a2804-765a-4d0c-ba8c-b07d4bd5da0a_762x785.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!cbr0!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F008a2804-765a-4d0c-ba8c-b07d4bd5da0a_762x785.png" width="762" height="785" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/008a2804-765a-4d0c-ba8c-b07d4bd5da0a_762x785.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:785,&quot;width&quot;:762,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:39107,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F008a2804-765a-4d0c-ba8c-b07d4bd5da0a_762x785.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!cbr0!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F008a2804-765a-4d0c-ba8c-b07d4bd5da0a_762x785.png 424w, https://substackcdn.com/image/fetch/$s_!cbr0!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F008a2804-765a-4d0c-ba8c-b07d4bd5da0a_762x785.png 848w, https://substackcdn.com/image/fetch/$s_!cbr0!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F008a2804-765a-4d0c-ba8c-b07d4bd5da0a_762x785.png 1272w, https://substackcdn.com/image/fetch/$s_!cbr0!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F008a2804-765a-4d0c-ba8c-b07d4bd5da0a_762x785.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>SciSpace Agent is credit-based (unlike SciSpace Deep Review), which gives you an idea of how expensive this process is.</p><p>So does it work? <a href="https://scispace.com/share/500ac4e6-7e0d-42e7-8345-a2a2882f3386">Sort of.</a></p><p>When I tried it, SciSpace Agents immediately behaved more like Claude/Gemini: it reasoned about what to do, identified the target paper, used various tools to find related work, extracted references into a JSON file with 52 entries, and attempted comparison, exactly as you would hope an agent or research assistant would do.</p><p>First, it identifies the target paper. 
Then it uses various tools such as Google Scholar, SciSpace Deep Review to find related papers, combines and dedupes </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!D8iP!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fddb33723-710b-4421-899c-61bac6bd4325_649x700.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!D8iP!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fddb33723-710b-4421-899c-61bac6bd4325_649x700.png 424w, https://substackcdn.com/image/fetch/$s_!D8iP!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fddb33723-710b-4421-899c-61bac6bd4325_649x700.png 848w, https://substackcdn.com/image/fetch/$s_!D8iP!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fddb33723-710b-4421-899c-61bac6bd4325_649x700.png 1272w, https://substackcdn.com/image/fetch/$s_!D8iP!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fddb33723-710b-4421-899c-61bac6bd4325_649x700.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!D8iP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fddb33723-710b-4421-899c-61bac6bd4325_649x700.png" width="649" height="700" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ddb33723-710b-4421-899c-61bac6bd4325_649x700.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:700,&quot;width&quot;:649,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:60426,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fddb33723-710b-4421-899c-61bac6bd4325_649x700.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!D8iP!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fddb33723-710b-4421-899c-61bac6bd4325_649x700.png 424w, https://substackcdn.com/image/fetch/$s_!D8iP!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fddb33723-710b-4421-899c-61bac6bd4325_649x700.png 848w, https://substackcdn.com/image/fetch/$s_!D8iP!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fddb33723-710b-4421-899c-61bac6bd4325_649x700.png 1272w, https://substackcdn.com/image/fetch/$s_!D8iP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fddb33723-710b-4421-899c-61bac6bd4325_649x700.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Here&#8217;s the critical part, it is able to use some tool to get the references of the paper in JSON.</p><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!_2wM!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe5e020f-1e0f-4a9c-8cb6-c3d92a2bb047_616x212.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!_2wM!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe5e020f-1e0f-4a9c-8cb6-c3d92a2bb047_616x212.png 424w, 
https://substackcdn.com/image/fetch/$s_!_2wM!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe5e020f-1e0f-4a9c-8cb6-c3d92a2bb047_616x212.png 848w, https://substackcdn.com/image/fetch/$s_!_2wM!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe5e020f-1e0f-4a9c-8cb6-c3d92a2bb047_616x212.png 1272w, https://substackcdn.com/image/fetch/$s_!_2wM!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe5e020f-1e0f-4a9c-8cb6-c3d92a2bb047_616x212.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!_2wM!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe5e020f-1e0f-4a9c-8cb6-c3d92a2bb047_616x212.png" width="616" height="212" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/fe5e020f-1e0f-4a9c-8cb6-c3d92a2bb047_616x212.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:212,&quot;width&quot;:616,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:15700,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe5e020f-1e0f-4a9c-8cb6-c3d92a2bb047_616x212.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!_2wM!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe5e020f-1e0f-4a9c-8cb6-c3d92a2bb047_616x212.png 424w, 
https://substackcdn.com/image/fetch/$s_!_2wM!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe5e020f-1e0f-4a9c-8cb6-c3d92a2bb047_616x212.png 848w, https://substackcdn.com/image/fetch/$s_!_2wM!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe5e020f-1e0f-4a9c-8cb6-c3d92a2bb047_616x212.png 1272w, https://substackcdn.com/image/fetch/$s_!_2wM!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffe5e020f-1e0f-4a9c-8cb6-c3d92a2bb047_616x212.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p>I looked at the JSON it downloaded , it does indeed have the 52 references.</p><p>It then loads the JSON and tries to compare with the metadata of other papers found</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!f3G3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fae3a0769-edd8-40ef-892e-d85ede0c2e6c_1849x832.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!f3G3!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fae3a0769-edd8-40ef-892e-d85ede0c2e6c_1849x832.png 424w, https://substackcdn.com/image/fetch/$s_!f3G3!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fae3a0769-edd8-40ef-892e-d85ede0c2e6c_1849x832.png 848w, 
https://substackcdn.com/image/fetch/$s_!f3G3!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fae3a0769-edd8-40ef-892e-d85ede0c2e6c_1849x832.png 1272w, https://substackcdn.com/image/fetch/$s_!f3G3!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fae3a0769-edd8-40ef-892e-d85ede0c2e6c_1849x832.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!f3G3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fae3a0769-edd8-40ef-892e-d85ede0c2e6c_1849x832.png" width="1456" height="655" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ae3a0769-edd8-40ef-892e-d85ede0c2e6c_1849x832.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:655,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:203385,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fae3a0769-edd8-40ef-892e-d85ede0c2e6c_1849x832.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!f3G3!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fae3a0769-edd8-40ef-892e-d85ede0c2e6c_1849x832.png 424w, 
https://substackcdn.com/image/fetch/$s_!f3G3!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fae3a0769-edd8-40ef-892e-d85ede0c2e6c_1849x832.png 848w, https://substackcdn.com/image/fetch/$s_!f3G3!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fae3a0769-edd8-40ef-892e-d85ede0c2e6c_1849x832.png 1272w, https://substackcdn.com/image/fetch/$s_!f3G3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fae3a0769-edd8-40ef-892e-d85ede0c2e6c_1849x832.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>I am not sure if it eventually succeeded but most of what it suggests are not cited (with a few exceptions where the matching failed due to incomplete metadata)</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!O8kF!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc8d2e214-95c8-4c01-b607-a8f56da97466_1149x877.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!O8kF!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc8d2e214-95c8-4c01-b607-a8f56da97466_1149x877.png 424w, https://substackcdn.com/image/fetch/$s_!O8kF!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc8d2e214-95c8-4c01-b607-a8f56da97466_1149x877.png 848w, https://substackcdn.com/image/fetch/$s_!O8kF!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc8d2e214-95c8-4c01-b607-a8f56da97466_1149x877.png 1272w, https://substackcdn.com/image/fetch/$s_!O8kF!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc8d2e214-95c8-4c01-b607-a8f56da97466_1149x877.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!O8kF!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc8d2e214-95c8-4c01-b607-a8f56da97466_1149x877.png" width="1149" height="877" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c8d2e214-95c8-4c01-b607-a8f56da97466_1149x877.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:877,&quot;width&quot;:1149,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:69485,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/180946268?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc8d2e214-95c8-4c01-b607-a8f56da97466_1149x877.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!O8kF!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc8d2e214-95c8-4c01-b607-a8f56da97466_1149x877.png 424w, https://substackcdn.com/image/fetch/$s_!O8kF!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc8d2e214-95c8-4c01-b607-a8f56da97466_1149x877.png 848w, https://substackcdn.com/image/fetch/$s_!O8kF!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc8d2e214-95c8-4c01-b607-a8f56da97466_1149x877.png 1272w, https://substackcdn.com/image/fetch/$s_!O8kF!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc8d2e214-95c8-4c01-b607-a8f56da97466_1149x877.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><h2>Conclusion</h2><p>This simple citation gap test reveals that most current Academic Deep Search and Deep Research tools are workflow-based agents operating within predefined patterns&#8212;not flexible reasoning systems that analyze task structure and devise novel approaches.</p><p>This doesn&#8217;t diminish their value. Academic Deep Search&#8217;s iterative retrieval with LLM-based relevance judgment is a genuine breakthrough. Deep Research&#8217;s ability to generate well-cited reports fills real needs. 
These tools ARE agents in the technical sense, and within their designed scope, they work impressively.</p><p>But marketing language suggesting flexible reasoning, autonomous problem-solving, and human-like research assistance probably overstates current capabilities and can lead to misunderstanding by users who take the term &#8220;agent&#8221; or &#8220;research assistant&#8221; at face value.</p><p>Again, Academic Deep Research tools are genuinely useful, but you have to be careful with the type of literature review tasks you try to do. If your task fits the workflow, you&#8217;ll often get excellent results. If it doesn&#8217;t, you may get a surprising failure.</p><blockquote><p>Given that standard LLMs like Claude Sonnet 4.5 on their home platforms are more &#8220;agentic&#8221; than specialised Academic Deep Research tools and <a href="https://aarontay.substack.com/p/mcp-servers-and-academic-search-the">they now can potentially gain access to paywalled academic content via MCP servers</a>, such platforms might be even better for more &#8220;agentic&#8221; literature review tasks!</p></blockquote><p>The question that should be on our minds is - how do vendors of such products communicate to users the limits of their Deep Research product? </p><p></p><h2>Appendix - More about testing</h2><p>When testing variants of my query, these systems often fall into four common failure modes:</p><ol><li><p><strong>Chronological Errors (Future Citations)</strong> The system outputs references published <em>after</em> the target paper. For example, when using a 2018 paper as the anchor, some tools return papers from 2022. This indicates the LLM failed to process the temporal constraint (filtering for papers published on or before the selected paper&#8217;s publication year).</p></li><li><p><strong>Redundant Outputs (Citation Overlap)</strong> The system outputs papers that are already cited by the selected paper. 
This doesn&#8217;t always mean the tool failed to compare the lists. It often indicates a <strong>metadata mismatch</strong>: the tool found a variant of the paper (e.g., a preprint vs. the published version) that matched semantically but not digitally. However, a sufficiently &#8220;smart&#8221; agent should be able to resolve these entities. Generally, if only one or two outputs overlap, it is likely a metadata issue; if most overlap, the logic likely failed.</p></li><li><p><strong>Accidental Compliance (&#8220;Luck&#8221;)</strong> The system outputs papers that are not cited by the selected paper despite failing to, or being unable to, check against the references at all&#8212;it simply happened to retrieve uncited works by chance. <em>Note:</em> In my specific test case, the selected paper has a highly comprehensive reference section. Therefore, it is unlikely a system could find many relevant, on-topic papers that are <em>not</em> cited purely by luck. If the results are relevant and uncited, the system likely performed the task correctly.</p></li><li><p><strong>Irrelevant Results</strong> The system outputs papers that do not overlap with the selected paper&#8217;s references, but they are not relevant to the topic. This suggests a retrieval failure. Alternatively, because the target paper&#8217;s reference section is so complete, the system may be forced to retrieve tangentially related papers to satisfy the &#8220;not cited&#8221; constraint.</p></li></ol><p>  </p>]]></content:encoded></item><item><title><![CDATA[Model Context Protocol (MCP) Servers - Wiley AI Gateway & PubMed - How Claude can now pilot test search strategies using PubMed]]></title><description><![CDATA[The Model Context Protocol may fundamentally change how AI tools access academic content. Rather than AI powered search engines building massive centralised indexes, MCP allows AI models to connect directly to publisher content in a real-time federated search model. 
This post demonstrates the use of Wiley AI Gateway and PubMed connectors when connected to Claude, showing how Claude can now pilot test search strategies for evidence synthesis using PubMed.]]></description><link>https://aarontay.substack.com/p/mcp-servers-and-academic-search-the</link><guid isPermaLink="false">https://aarontay.substack.com/p/mcp-servers-and-academic-search-the</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Sun, 30 Nov 2025 21:30:06 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!0FxO!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb74db47a-0fa1-4f4c-9ac3-68a96368da80_1111x758.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<p>AI search tools like <a href="http://elicit.com">Elicit</a>, <a href="http://Consensus.app">Consensus</a>, and <a href="http://scite.ai">Scite.ai</a> have spent years racing to build centralised indexes of academic content&#8212; first by indexing the open content that is available and then trying to get publisher partnerships. But unlike their predecessors of the 2010s - the <a href="https://musingsaboutlibrarianship.blogspot.com/search/label/web%20scale%20discovery">Web Scale Discovery systems</a> (now called &#8220;Discovery layers&#8221; or &#8220;Discovery Services&#8221;) like <a href="https://exlibrisgroup.com/products/summon-library-discovery/">Summon</a>, <a href="https://about.ebsco.com/products/ebsco-discovery-service">Ebsco Discovery Service</a>, <a href="https://exlibrisgroup.com/products/primo-discovery-service/">Primo</a>, publishers are much more wary of handing over content for indexing amid intense concerns about AI training on copyrighted material. The <a href="https://www.anthropic.com/news/model-context-protocol">Model Context Protocol</a> (MCP) offers an alternative path. 
MCP allows AI models to query publisher content directly through standardised servers, keeping full text on publisher infrastructure while enabling real-time retrieval. </p><p>Interestingly, this isn&#8217;t just an architectural workaround; it changes what&#8217;s possible. Using MCP, Claude can now pilot-test Boolean searches against PubMed, check MeSH headings, assess recall, and iteratively refine strategies&#8212;capabilities that were impossible when LLMs generated search strings blindly. For evidence synthesis and library discovery, this may be the most consequential development since federated search gave way to discovery layers.</p><p>Caveat: My understanding of MCP is still developing, so treat the technical details with appropriate caution.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me a Coffee! (via ko-fi)&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me a Coffee! (via ko-fi)</span></a></p><p></p><h2>Summary</h2><p>The <a href="https://www.anthropic.com/news/model-context-protocol">Model Context Protocol</a> may fundamentally change how AI tools access academic content. 
Rather than building massive centralised indexes (the approach taken by Elicit, Consensus, and others), MCP allows AI models to connect directly to publisher content through standardised &#8220;servers.&#8221;</p><p>I&#8217;ve been testing two MCP servers: the <a href="https://www.wiley.com/en-us/solutions-partnerships/ai-solutions/">Wiley AI Gateway</a> and a <a href="https://support.claude.com/en/articles/12614801-using-the-pubmed-connector-in-claude">PubMed MCP server</a>.</p><p>My key findings: </p><ul><li><p><strong>MCP makes AI-to-content connections more transparent</strong>: You can see exactly how your natural language query gets translated and what content (metadata, text chunks or even full text) is retrieved</p></li><li><p><strong>Wiley&#8217;s approach is impressively open</strong>: They&#8217;ve shared their evaluation metrics with me and plan public transparency about search quality&#8212;a welcome departure from the opacity of traditional discovery vendors</p></li><li><p><strong>LLMs can now pilot-test Boolean search strategies</strong>: This is huge for evidence synthesis. Rather than generating search strings blindly, Claude can actually run searches against PubMed, check MeSH headings, and iteratively refine strategies</p></li><li><p><strong>History may not repeat</strong>: If you&#8217;ve been in libraries long enough, the architecture that MCP represents might sound familiar. We tried something like this before&#8212;<a href="https://federatedsearchblog.com/2009/03/19/beyond-federated-search/">federated search in the 2000s</a>&#8212;<a href="http://www.tandfonline.com/doi/abs/10.1080/19322909.2011.573533">and it failed</a>. 
But the technology and incentives have changed in ways that matter.</p></li></ul><p>Read on for detailed walkthroughs, JSON response examples, and my thoughts on what this means for libraries, publishers, and academic AI search vendors.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><h2>What is MCP?</h2><div id="youtube2-taeX8tgpPRQ" class="youtube-wrap" data-attrs="{&quot;videoId&quot;:&quot;taeX8tgpPRQ&quot;,&quot;startTime&quot;:null,&quot;endTime&quot;:null}" data-component-name="Youtube2ToDOM"><div class="youtube-inner"><iframe src="https://www.youtube-nocookie.com/embed/taeX8tgpPRQ?rel=0&amp;autoplay=0&amp;showinfo=0&amp;enablejsapi=0" frameborder="0" loading="lazy" gesture="media" allow="autoplay; fullscreen" allowautoplay="true" allowfullscreen="true" width="728" height="409"></iframe></div></div><p>MCP&#8212;Model Context Protocol&#8212;was created by Anthropic and released as an open-source standard in late 2024. 
I initially ignored it, but by 2025 both OpenAI and Google announced support, making it the de facto standard.</p><h2>The USB-C Analogy</h2><p>The easiest way to understand MCP is as a &#8220;USB-C port&#8221; for Artificial Intelligence.</p><p>Currently, most AI models are &#8220;walled gardens.&#8221; They have immense internal knowledge from pretraining but cannot easily access newer information or content they&#8217;ve never seen&#8212;such as your library&#8217;s subscription databases, catalogues, or repositories.</p><p>While most LLMs now have built-in web search tools to browse the web (kinda like a human), this method only accesses open content and tends to work slowly compared to direct API access to specific sources. However, this meant developers had to build custom integrations for every database they wanted the AI to access.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!-eo4!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06d79bf5-c167-41ce-8eb4-929905ab22cd_892x388.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!-eo4!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06d79bf5-c167-41ce-8eb4-929905ab22cd_892x388.png 424w, https://substackcdn.com/image/fetch/$s_!-eo4!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06d79bf5-c167-41ce-8eb4-929905ab22cd_892x388.png 848w, https://substackcdn.com/image/fetch/$s_!-eo4!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06d79bf5-c167-41ce-8eb4-929905ab22cd_892x388.png 1272w, 
https://substackcdn.com/image/fetch/$s_!-eo4!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06d79bf5-c167-41ce-8eb4-929905ab22cd_892x388.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!-eo4!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06d79bf5-c167-41ce-8eb4-929905ab22cd_892x388.png" width="892" height="388" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/06d79bf5-c167-41ce-8eb4-929905ab22cd_892x388.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:388,&quot;width&quot;:892,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:29124,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06d79bf5-c167-41ce-8eb4-929905ab22cd_892x388.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!-eo4!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06d79bf5-c167-41ce-8eb4-929905ab22cd_892x388.png 424w, https://substackcdn.com/image/fetch/$s_!-eo4!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06d79bf5-c167-41ce-8eb4-929905ab22cd_892x388.png 848w, https://substackcdn.com/image/fetch/$s_!-eo4!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06d79bf5-c167-41ce-8eb4-929905ab22cd_892x388.png 1272w, 
https://substackcdn.com/image/fetch/$s_!-eo4!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06d79bf5-c167-41ce-8eb4-929905ab22cd_892x388.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><em>Default web search in Claude; similar functionality exists in ChatGPT and Gemini</em></p><p></p><p>MCP solves this by creating a universal standard&#8212;an open protocol that lets any AI model plug into any data source instantly, without complex custom coding.</p><blockquote><p>MCP servers can be used for taking actions beyond just search of course, MCP 
servers can write documents, send emails etc. Edit: Rod Page has shared with me <a href="https://iphylo.blogspot.com/2025/11/model-context-protocol-mcp-and-triple.html">how another use case is using Large Language Models and MCP servers to provide a user-friendly way to query knowledge graphs/linked data without requiring the user to know SPARQL.</a></p></blockquote><p>In short, the MCP servers you set up are like a menu that lets the LLM/AI &#8220;know&#8221; what tools and functionality are available - which it can use when necessary.</p><h3>The &#8220;N &#215; M&#8221; Problem</h3><p>Before MCP, the AI industry faced a logistical challenge. There are dozens of AI models (ChatGPT, Claude, Gemini, Llama, etc.) and millions of data sources (PubMed, Wiley, JSTOR, Google Drive, Slack). Connecting PubMed to ChatGPT required custom code. Connecting PubMed to Claude? Different custom code. Every new AI model meant rebuilding integrations from scratch.</p><p>MCP acts like a universal power outlet. Instead of building a &#8220;PubMed-to-ChatGPT&#8221; connector, developers build a single &#8220;PubMed-to-MCP&#8221; server. Once built, any MCP-compliant AI can instantly plug in.</p><p>This explains why platforms like the Wiley AI Gateway exist. Wiley didn&#8217;t have to build separate integrations for every AI company&#8212;they built one MCP-compatible gateway. The same logic applies to libraries with open repositories. Previously, you&#8217;d have to decide: build a ChatGPT plugin? A Gemini &#8220;Gem&#8221;? Now you just offer an MCP server. </p><blockquote><h3>How MCP Relates to RAG</h3><p>How does Retrieval Augmented Generation (RAG) relate to MCP?</p><p><strong>RAG</strong> answers: &#8220;How do I find and use documents to ground the model&#8217;s answer?&#8221;</p><p><strong>MCP</strong> answers: &#8220;How does the model call the search and document APIs that let it do that?&#8221;</p><p>Systems can use MCP as part of your RAG pipeline. 
We will discuss this distinction in future posts.</p></blockquote><h2>MCP server - Tools, Resources, Prompts</h2><p>MCP protocol consists of MCP host/client (e.g. Claude Desktop) and MCP Servers (e.g. Wiley AI Gateway).</p><blockquote><p>I will ignore the distinction between MCP host and MCP Client for now</p></blockquote><p>An MCP server can be hosted in the cloud, or it can run locally on your own machine.</p><blockquote><p>There are somewhat technical <a href="https://huggingface.co/blog/mcp-for-research">guides on how to do this to connect to academic sources.</a> Most of these are to <a href="https://www.pulsemcp.com/servers/afrise-academic-search">MCP Servers that connect to open content like Arxiv</a>, <a href="https://mcpmarket.com/server/academic-search">Semantic Scholar, OpenAlex</a>. Even though the default Web Search is likely to be able to access the same sources, a direct MCP connection is likely to be faster. </p></blockquote><p>MCP servers consist of three main elements - Tools, Resources, Prompts</p><div id="youtube2-zPmJ8soT2DQ" class="youtube-wrap" data-attrs="{&quot;videoId&quot;:&quot;zPmJ8soT2DQ&quot;,&quot;startTime&quot;:null,&quot;endTime&quot;:null}" data-component-name="Youtube2ToDOM"><div class="youtube-inner"><iframe src="https://www.youtube-nocookie.com/embed/zPmJ8soT2DQ?rel=0&amp;autoplay=0&amp;showinfo=0&amp;enablejsapi=0" frameborder="0" loading="lazy" gesture="media" allow="autoplay; fullscreen" allowautoplay="true" allowfullscreen="true" width="728" height="409"></iframe></div></div><p>I won&#8217;t go in depth into the other two, but of these three elements, tools are probably the most important for us to understand because they are the &#8220;Verbs&#8221; or actions on what the MCP server allows the LLM to do. 
</p><p>Here is an example of the &#8220;tools&#8221; available to the <a href="https://support.claude.com/en/articles/12614801-using-the-pubmed-connector-in-claude">PubMed MCP server I connected to</a></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!kSL2!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bb131f8-da66-4c33-90cc-5b67c7ba84fb_713x548.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!kSL2!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bb131f8-da66-4c33-90cc-5b67c7ba84fb_713x548.png 424w, https://substackcdn.com/image/fetch/$s_!kSL2!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bb131f8-da66-4c33-90cc-5b67c7ba84fb_713x548.png 848w, https://substackcdn.com/image/fetch/$s_!kSL2!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bb131f8-da66-4c33-90cc-5b67c7ba84fb_713x548.png 1272w, https://substackcdn.com/image/fetch/$s_!kSL2!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bb131f8-da66-4c33-90cc-5b67c7ba84fb_713x548.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!kSL2!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bb131f8-da66-4c33-90cc-5b67c7ba84fb_713x548.png" width="713" height="548" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/6bb131f8-da66-4c33-90cc-5b67c7ba84fb_713x548.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:548,&quot;width&quot;:713,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:38039,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bb131f8-da66-4c33-90cc-5b67c7ba84fb_713x548.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!kSL2!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bb131f8-da66-4c33-90cc-5b67c7ba84fb_713x548.png 424w, https://substackcdn.com/image/fetch/$s_!kSL2!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bb131f8-da66-4c33-90cc-5b67c7ba84fb_713x548.png 848w, https://substackcdn.com/image/fetch/$s_!kSL2!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bb131f8-da66-4c33-90cc-5b67c7ba84fb_713x548.png 1272w, https://substackcdn.com/image/fetch/$s_!kSL2!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6bb131f8-da66-4c33-90cc-5b67c7ba84fb_713x548.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This gives you an idea of what the PubMed MCP server allows the LLM to do and not do, which will be very important for understanding what you can ask for.</p><p>For example, from this list, you can probably guess asking the LLM to use this MCP server to find citations of a given paper probably won&#8217;t work (&#8220;Lookup articles by citations&#8221; refers to verifying citations and finding PubMed IDs from journal references).</p><p>It can &#8220;search articles&#8221;, &#8220;Get article metadata&#8221; and also <a href="https://support.claude.com/en/articles/12614801-using-the-pubmed-connector-in-claude">retrieve 8 million full-text via PMC</a>.</p><p>Learn <a href="https://support.claude.com/en/articles/12614801-using-the-pubmed-connector-in-claude">more about the tools offered by PubMed connector.</a></p><p></p><h2>My 
testing setup</h2><p>For my blog series, I will be taking the easiest approach with no setup. </p><p>I will be using the Claude web interface (paid version needed) as the host/client and turn on connection to two specific connectors/MCP servers (connectors &amp; MCP servers will be used interchangeably) which are already available to be turned on without any additional setup.</p><ol><li><p><a href="https://support.claude.com/en/articles/12614801-using-the-pubmed-connector-in-claude">PubMed MCP server (from Anthropic)</a></p></li><li><p><a href="https://www.wiley.com/en-us/solutions-partnerships/ai-solutions/">Wiley AI Gateway</a> (listed as &#8220;Scholar Gateway&#8221; in the interface)</p></li></ol><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!oOAr!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5839392e-613e-4c72-97b0-f529d35f5866_866x493.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!oOAr!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5839392e-613e-4c72-97b0-f529d35f5866_866x493.png 424w, https://substackcdn.com/image/fetch/$s_!oOAr!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5839392e-613e-4c72-97b0-f529d35f5866_866x493.png 848w, https://substackcdn.com/image/fetch/$s_!oOAr!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5839392e-613e-4c72-97b0-f529d35f5866_866x493.png 1272w, 
https://substackcdn.com/image/fetch/$s_!oOAr!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5839392e-613e-4c72-97b0-f529d35f5866_866x493.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!oOAr!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5839392e-613e-4c72-97b0-f529d35f5866_866x493.png" width="866" height="493" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/5839392e-613e-4c72-97b0-f529d35f5866_866x493.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:493,&quot;width&quot;:866,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:40568,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5839392e-613e-4c72-97b0-f529d35f5866_866x493.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!oOAr!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5839392e-613e-4c72-97b0-f529d35f5866_866x493.png 424w, https://substackcdn.com/image/fetch/$s_!oOAr!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5839392e-613e-4c72-97b0-f529d35f5866_866x493.png 848w, https://substackcdn.com/image/fetch/$s_!oOAr!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5839392e-613e-4c72-97b0-f529d35f5866_866x493.png 1272w, 
https://substackcdn.com/image/fetch/$s_!oOAr!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5839392e-613e-4c72-97b0-f529d35f5866_866x493.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>You can of course add a lot more connectors/MCP servers both default or custom ones.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" 
href="https://substackcdn.com/image/fetch/$s_!Gc1M!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc8c89a3-82c1-41fd-b97e-8203d57dd115_805x856.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Gc1M!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc8c89a3-82c1-41fd-b97e-8203d57dd115_805x856.png 424w, https://substackcdn.com/image/fetch/$s_!Gc1M!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc8c89a3-82c1-41fd-b97e-8203d57dd115_805x856.png 848w, https://substackcdn.com/image/fetch/$s_!Gc1M!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc8c89a3-82c1-41fd-b97e-8203d57dd115_805x856.png 1272w, https://substackcdn.com/image/fetch/$s_!Gc1M!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc8c89a3-82c1-41fd-b97e-8203d57dd115_805x856.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Gc1M!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc8c89a3-82c1-41fd-b97e-8203d57dd115_805x856.png" width="805" height="856" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/bc8c89a3-82c1-41fd-b97e-8203d57dd115_805x856.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:856,&quot;width&quot;:805,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:95880,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc8c89a3-82c1-41fd-b97e-8203d57dd115_805x856.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Gc1M!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc8c89a3-82c1-41fd-b97e-8203d57dd115_805x856.png 424w, https://substackcdn.com/image/fetch/$s_!Gc1M!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc8c89a3-82c1-41fd-b97e-8203d57dd115_805x856.png 848w, https://substackcdn.com/image/fetch/$s_!Gc1M!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc8c89a3-82c1-41fd-b97e-8203d57dd115_805x856.png 1272w, https://substackcdn.com/image/fetch/$s_!Gc1M!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc8c89a3-82c1-41fd-b97e-8203d57dd115_805x856.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>I think with some setup you can possibly also connect Claude to other academic sources like OpenAlex, Semantic Scholar, Arxiv or use ChatGPT plus to connect to custom MCP servers. </p><p> </p><h2>Testing the Wiley AI Gateway</h2><p><a href="https://newsroom.wiley.com/press-releases/press-release-details/2025/Wiley-Launches-Interoperable-Platform-to-Power-Scientific-Discovery-in-Worlds-Leading-AI-Technologies/default.aspx">Wiley appears to be one of the first major scholarly publishers to offer an official MCP server, launching in October 2025</a>. (Another <a href="https://www.statista.com/press/p/statista_next_ai_leap/?srsltid=AfmBOopL0-QXu3-WwGubPHLFfU-XIoSbzeucGUjWlhEw5G1_lxqx-RyI">early adopter is Statista</a>.) 
Based on their press release, they support platforms like Anthropic&#8217;s Claude, AWS Marketplace, Mistral AI&#8217;s Le Chat, and Perplexity.</p><p>When you first add the Wiley AI Gateway to Claude, you will see this support page.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!oIx5!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F16fc168b-e4c2-4b91-9218-720cd7d11607_1213x662.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!oIx5!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F16fc168b-e4c2-4b91-9218-720cd7d11607_1213x662.png 424w, https://substackcdn.com/image/fetch/$s_!oIx5!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F16fc168b-e4c2-4b91-9218-720cd7d11607_1213x662.png 848w, https://substackcdn.com/image/fetch/$s_!oIx5!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F16fc168b-e4c2-4b91-9218-720cd7d11607_1213x662.png 1272w, https://substackcdn.com/image/fetch/$s_!oIx5!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F16fc168b-e4c2-4b91-9218-720cd7d11607_1213x662.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!oIx5!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F16fc168b-e4c2-4b91-9218-720cd7d11607_1213x662.png" width="1213" height="662" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/16fc168b-e4c2-4b91-9218-720cd7d11607_1213x662.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:662,&quot;width&quot;:1213,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:177091,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F16fc168b-e4c2-4b91-9218-720cd7d11607_1213x662.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!oIx5!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F16fc168b-e4c2-4b91-9218-720cd7d11607_1213x662.png 424w, https://substackcdn.com/image/fetch/$s_!oIx5!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F16fc168b-e4c2-4b91-9218-720cd7d11607_1213x662.png 848w, https://substackcdn.com/image/fetch/$s_!oIx5!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F16fc168b-e4c2-4b91-9218-720cd7d11607_1213x662.png 1272w, https://substackcdn.com/image/fetch/$s_!oIx5!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F16fc168b-e4c2-4b91-9218-720cd7d11607_1213x662.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>It provides a ton of information</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!0FxO!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb74db47a-0fa1-4f4c-9ac3-68a96368da80_1111x758.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!0FxO!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb74db47a-0fa1-4f4c-9ac3-68a96368da80_1111x758.png 424w, 
https://substackcdn.com/image/fetch/$s_!0FxO!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb74db47a-0fa1-4f4c-9ac3-68a96368da80_1111x758.png 848w, https://substackcdn.com/image/fetch/$s_!0FxO!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb74db47a-0fa1-4f4c-9ac3-68a96368da80_1111x758.png 1272w, https://substackcdn.com/image/fetch/$s_!0FxO!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb74db47a-0fa1-4f4c-9ac3-68a96368da80_1111x758.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!0FxO!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb74db47a-0fa1-4f4c-9ac3-68a96368da80_1111x758.png" width="1111" height="758" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/b74db47a-0fa1-4f4c-9ac3-68a96368da80_1111x758.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:758,&quot;width&quot;:1111,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:247117,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb74db47a-0fa1-4f4c-9ac3-68a96368da80_1111x758.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!0FxO!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb74db47a-0fa1-4f4c-9ac3-68a96368da80_1111x758.png 424w, https://substackcdn.com/image/fetch/$s_!0FxO!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb74db47a-0fa1-4f4c-9ac3-68a96368da80_1111x758.png 848w, https://substackcdn.com/image/fetch/$s_!0FxO!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb74db47a-0fa1-4f4c-9ac3-68a96368da80_1111x758.png 1272w, https://substackcdn.com/image/fetch/$s_!0FxO!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb74db47a-0fa1-4f4c-9ac3-68a96368da80_1111x758.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" 
stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Even advice on how to prompt</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!FtCG!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5d3078cc-8d8d-43b2-ae54-65b7ff98b707_923x1018.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!FtCG!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5d3078cc-8d8d-43b2-ae54-65b7ff98b707_923x1018.png 424w, https://substackcdn.com/image/fetch/$s_!FtCG!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5d3078cc-8d8d-43b2-ae54-65b7ff98b707_923x1018.png 848w, https://substackcdn.com/image/fetch/$s_!FtCG!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5d3078cc-8d8d-43b2-ae54-65b7ff98b707_923x1018.png 1272w, https://substackcdn.com/image/fetch/$s_!FtCG!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5d3078cc-8d8d-43b2-ae54-65b7ff98b707_923x1018.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!FtCG!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5d3078cc-8d8d-43b2-ae54-65b7ff98b707_923x1018.png" width="923" height="1018" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/5d3078cc-8d8d-43b2-ae54-65b7ff98b707_923x1018.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1018,&quot;width&quot;:923,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:101987,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5d3078cc-8d8d-43b2-ae54-65b7ff98b707_923x1018.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!FtCG!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5d3078cc-8d8d-43b2-ae54-65b7ff98b707_923x1018.png 424w, https://substackcdn.com/image/fetch/$s_!FtCG!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5d3078cc-8d8d-43b2-ae54-65b7ff98b707_923x1018.png 848w, https://substackcdn.com/image/fetch/$s_!FtCG!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5d3078cc-8d8d-43b2-ae54-65b7ff98b707_923x1018.png 1272w, https://substackcdn.com/image/fetch/$s_!FtCG!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5d3078cc-8d8d-43b2-ae54-65b7ff98b707_923x1018.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>and a list of FAQs, but there seems to be no easy way to go back to this page except by disconnecting and connecting again.</p><p>I was given beta access and I (or more accurately Claude) can theoretically access the entire collection of 3 million Wiley articles through the Wiley AI Gateway MCP server. In my tests below, I used either Sonnet 4.5 or Opus 4.5, generally without &#8220;research&#8221; mode enabled. 
I turned off web search and only enabled the Wiley AI Gateway connector.</p><blockquote><p>As you will see later, both the Wiley AI Gateway and PubMed connector will fail for certain queries due to their limitations, but if you have the Web search functionality turned on as well, it may be able to compensate for these issues.</p></blockquote><h3>Transparency in Action</h3><p>While the FAQ suggests I need to state that I am looking for scholarly resources or to use Scholar Gateway, I found it always used it correctly when needed, perhaps because I turned off the other connectors like default web search.</p><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!IbGo!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14b44607-dba1-41a5-bc1a-b2bb369b169f_1413x312.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!IbGo!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14b44607-dba1-41a5-bc1a-b2bb369b169f_1413x312.png 424w, https://substackcdn.com/image/fetch/$s_!IbGo!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14b44607-dba1-41a5-bc1a-b2bb369b169f_1413x312.png 848w, https://substackcdn.com/image/fetch/$s_!IbGo!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14b44607-dba1-41a5-bc1a-b2bb369b169f_1413x312.png 1272w, https://substackcdn.com/image/fetch/$s_!IbGo!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14b44607-dba1-41a5-bc1a-b2bb369b169f_1413x312.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!IbGo!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14b44607-dba1-41a5-bc1a-b2bb369b169f_1413x312.png" width="1413" height="312" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/14b44607-dba1-41a5-bc1a-b2bb369b169f_1413x312.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:312,&quot;width&quot;:1413,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!IbGo!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14b44607-dba1-41a5-bc1a-b2bb369b169f_1413x312.png 424w, https://substackcdn.com/image/fetch/$s_!IbGo!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14b44607-dba1-41a5-bc1a-b2bb369b169f_1413x312.png 848w, https://substackcdn.com/image/fetch/$s_!IbGo!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14b44607-dba1-41a5-bc1a-b2bb369b169f_1413x312.png 1272w, https://substackcdn.com/image/fetch/$s_!IbGo!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14b44607-dba1-41a5-bc1a-b2bb369b169f_1413x312.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p>One thing I didn&#8217;t appreciate until testing was how transparent everything is when using the Wiley AI Gateway through 
Claude&#8217;s interface. You can see all queries and responses in JSON.</p><p>Here&#8217;s <a href="https://claude.ai/share/315f8064-2b26-435a-a063-e7bde490bf0c">a simple prompt or query</a> I sent to Claude with only the Wiley AI Gateway enabled: </p><p>You can see my prompt and Claude &#8220;thinking&#8221; and &#8220;deciding&#8221; to search for papers by calling the Scholar Gateway Search with what Claude calls a &#8220;<a href="https://aarontay.substack.com/p/why-embedding-vector-search-is-probably">semantic search</a>&#8221;.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!QnLb!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4395c4d-d8a1-44bc-9260-9d8a734b0c22_947x632.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!QnLb!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4395c4d-d8a1-44bc-9260-9d8a734b0c22_947x632.png 424w, https://substackcdn.com/image/fetch/$s_!QnLb!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4395c4d-d8a1-44bc-9260-9d8a734b0c22_947x632.png 848w, https://substackcdn.com/image/fetch/$s_!QnLb!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4395c4d-d8a1-44bc-9260-9d8a734b0c22_947x632.png 1272w, https://substackcdn.com/image/fetch/$s_!QnLb!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4395c4d-d8a1-44bc-9260-9d8a734b0c22_947x632.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!QnLb!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4395c4d-d8a1-44bc-9260-9d8a734b0c22_947x632.png" width="947" height="632" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f4395c4d-d8a1-44bc-9260-9d8a734b0c22_947x632.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:632,&quot;width&quot;:947,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:46721,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4395c4d-d8a1-44bc-9260-9d8a734b0c22_947x632.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!QnLb!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4395c4d-d8a1-44bc-9260-9d8a734b0c22_947x632.png 424w, https://substackcdn.com/image/fetch/$s_!QnLb!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4395c4d-d8a1-44bc-9260-9d8a734b0c22_947x632.png 848w, https://substackcdn.com/image/fetch/$s_!QnLb!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4395c4d-d8a1-44bc-9260-9d8a734b0c22_947x632.png 1272w, https://substackcdn.com/image/fetch/$s_!QnLb!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff4395c4d-d8a1-44bc-9260-9d8a734b0c22_947x632.png 1456w" sizes="100vw" 
loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Even with minimal JSON familiarity, you should be able to make out how my natural language query was translated&#8212;correctly limiting results from 2020 to 2025. It also retrieves the top 20 ranked results.</p><p></p><h3>Under the Hood: RAG with Chunks</h3><p>The Wiley team explained that what happens in the background is standard RAG: full text is chunked, and<a href="https://aarontay.substack.com/p/why-embedding-vector-search-is-probably"> &#8220;semantic search&#8221; (dense embedding/retrieval)</a> matches chunks to queries with reranking of the top 30 chunks. 
I was told they plan to add hybrid search (possibly BM25?) and/or knowledge graphs in the future.</p><p>This is backed up by the FAQ</p><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!lvud!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13543c38-c642-4c82-a922-753783cfc41c_1301x291.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!lvud!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13543c38-c642-4c82-a922-753783cfc41c_1301x291.png 424w, https://substackcdn.com/image/fetch/$s_!lvud!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13543c38-c642-4c82-a922-753783cfc41c_1301x291.png 848w, https://substackcdn.com/image/fetch/$s_!lvud!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13543c38-c642-4c82-a922-753783cfc41c_1301x291.png 1272w, https://substackcdn.com/image/fetch/$s_!lvud!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13543c38-c642-4c82-a922-753783cfc41c_1301x291.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!lvud!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13543c38-c642-4c82-a922-753783cfc41c_1301x291.png" width="1301" height="291" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/13543c38-c642-4c82-a922-753783cfc41c_1301x291.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:291,&quot;width&quot;:1301,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:45396,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13543c38-c642-4c82-a922-753783cfc41c_1301x291.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!lvud!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13543c38-c642-4c82-a922-753783cfc41c_1301x291.png 424w, https://substackcdn.com/image/fetch/$s_!lvud!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13543c38-c642-4c82-a922-753783cfc41c_1301x291.png 848w, https://substackcdn.com/image/fetch/$s_!lvud!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13543c38-c642-4c82-a922-753783cfc41c_1301x291.png 1272w, https://substackcdn.com/image/fetch/$s_!lvud!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13543c38-c642-4c82-a922-753783cfc41c_1301x291.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p>Coverage-wise, it currently covers 3 million or so articles from Wiley, but there are plans to include content from other publishers who partner with Wiley.</p><div 
class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!SfTY!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd7bb53b-3abf-42a5-ade7-142ecf2805fa_1409x342.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!SfTY!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd7bb53b-3abf-42a5-ade7-142ecf2805fa_1409x342.png 424w, https://substackcdn.com/image/fetch/$s_!SfTY!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd7bb53b-3abf-42a5-ade7-142ecf2805fa_1409x342.png 848w, https://substackcdn.com/image/fetch/$s_!SfTY!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd7bb53b-3abf-42a5-ade7-142ecf2805fa_1409x342.png 1272w, https://substackcdn.com/image/fetch/$s_!SfTY!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd7bb53b-3abf-42a5-ade7-142ecf2805fa_1409x342.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!SfTY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd7bb53b-3abf-42a5-ade7-142ecf2805fa_1409x342.png" width="1409" height="342" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/dd7bb53b-3abf-42a5-ade7-142ecf2805fa_1409x342.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:342,&quot;width&quot;:1409,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:55109,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd7bb53b-3abf-42a5-ade7-142ecf2805fa_1409x342.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!SfTY!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd7bb53b-3abf-42a5-ade7-142ecf2805fa_1409x342.png 424w, https://substackcdn.com/image/fetch/$s_!SfTY!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd7bb53b-3abf-42a5-ade7-142ecf2805fa_1409x342.png 848w, https://substackcdn.com/image/fetch/$s_!SfTY!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd7bb53b-3abf-42a5-ade7-142ecf2805fa_1409x342.png 1272w, https://substackcdn.com/image/fetch/$s_!SfTY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd7bb53b-3abf-42a5-ade7-142ecf2805fa_1409x342.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p></p><h3>Impressive Transparency on Search Quality</h3><p>What really impressed me was Wiley&#8217;s willingness to share their evaluation metrics&#8212;and their permission for me to 
share some details publicly.</p><p>I am told they plan to be very transparent about how they measure quality, though they&#8217;re still finalising the exact format for disclosure. This is a bold and welcome step. We&#8217;ve always lacked this transparency from discovery vendors, and it raises the bar significantly. Given that Wiley AI Gateway is probably one of the first major academic MCP servers, hopefully it sets a standard for others.</p><p>Below is a small snippet of what they shared with me.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!NwtO!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06e8b215-3d1b-4fd3-921a-34e82f292ebb_611x460.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!NwtO!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06e8b215-3d1b-4fd3-921a-34e82f292ebb_611x460.png 424w, https://substackcdn.com/image/fetch/$s_!NwtO!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06e8b215-3d1b-4fd3-921a-34e82f292ebb_611x460.png 848w, https://substackcdn.com/image/fetch/$s_!NwtO!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06e8b215-3d1b-4fd3-921a-34e82f292ebb_611x460.png 1272w, https://substackcdn.com/image/fetch/$s_!NwtO!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06e8b215-3d1b-4fd3-921a-34e82f292ebb_611x460.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!NwtO!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06e8b215-3d1b-4fd3-921a-34e82f292ebb_611x460.png" width="611" height="460" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/06e8b215-3d1b-4fd3-921a-34e82f292ebb_611x460.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:460,&quot;width&quot;:611,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:24727,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06e8b215-3d1b-4fd3-921a-34e82f292ebb_611x460.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!NwtO!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06e8b215-3d1b-4fd3-921a-34e82f292ebb_611x460.png 424w, https://substackcdn.com/image/fetch/$s_!NwtO!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06e8b215-3d1b-4fd3-921a-34e82f292ebb_611x460.png 848w, https://substackcdn.com/image/fetch/$s_!NwtO!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06e8b215-3d1b-4fd3-921a-34e82f292ebb_611x460.png 1272w, https://substackcdn.com/image/fetch/$s_!NwtO!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06e8b215-3d1b-4fd3-921a-34e82f292ebb_611x460.png 1456w" sizes="100vw" 
loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Looking at their evaluations (based on 750 questions from their test set), the DOI precision@10 of 85.2% makes sense. This implies that if you search for a paper by DOI, there&#8217;s a roughly 15% chance the correct paper doesn&#8217;t appear in the top 10. 
In fact, one of my first tests failed to retrieve a paper by DOI, initially making me think the tool couldn&#8217;t handle DOI retrieval at all.</p><p>Chunk Precision@10 of 68.4% looks bad, but in the report they shared, they benchmarked against a leading dense embedding model (BGE-M3) which was only 8% better, so while there is still room for improvement, it is not terrible.</p><h2> The Response Format</h2><p> </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!7upA!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d2aa86-1297-41b7-aa55-d482c71cc373_668x290.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!7upA!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d2aa86-1297-41b7-aa55-d482c71cc373_668x290.png 424w, https://substackcdn.com/image/fetch/$s_!7upA!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d2aa86-1297-41b7-aa55-d482c71cc373_668x290.png 848w, https://substackcdn.com/image/fetch/$s_!7upA!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d2aa86-1297-41b7-aa55-d482c71cc373_668x290.png 1272w, https://substackcdn.com/image/fetch/$s_!7upA!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d2aa86-1297-41b7-aa55-d482c71cc373_668x290.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!7upA!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d2aa86-1297-41b7-aa55-d482c71cc373_668x290.png" 
width="668" height="290" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c6d2aa86-1297-41b7-aa55-d482c71cc373_668x290.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:290,&quot;width&quot;:668,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:59426,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d2aa86-1297-41b7-aa55-d482c71cc373_668x290.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!7upA!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d2aa86-1297-41b7-aa55-d482c71cc373_668x290.png 424w, https://substackcdn.com/image/fetch/$s_!7upA!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d2aa86-1297-41b7-aa55-d482c71cc373_668x290.png 848w, https://substackcdn.com/image/fetch/$s_!7upA!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d2aa86-1297-41b7-aa55-d482c71cc373_668x290.png 1272w, https://substackcdn.com/image/fetch/$s_!7upA!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6d2aa86-1297-41b7-aa55-d482c71cc373_668x290.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container 
restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Responses come in JSON and are relatively easy to interpret. For a typical query, it retrieves 20 results. 
For each result, you can see:</p><ul><li><p>Chunk number retrieved and the total number of chunks in the article</p></li><li><p>Metadata: article title, journal title, volume, issue, page, publication type, ISSN, publisher, abstract etc</p></li><li><p>Retraction status (important <a href="https://retractionwatch.com/2025/11/19/ai-unreliable-identifying-retracted-research-papers-study/">since LLMs often cite retracted works that are retrieved</a> &amp; one can filter retracted papers off - or perhaps the LLM given this information can use it in the generated answer), Open Access status</p></li><li><p>The actual text of the chunk</p></li><li><p>Relevance scores (rerank_score, rrf_score)</p></li></ul><p>For the first result, you can see that it says it retrieved chunk 9 and various metadata of the article.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!-xuP!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9e44a3dc-c03b-4f39-bf6d-c5ffc512a05d_1914x959.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!-xuP!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9e44a3dc-c03b-4f39-bf6d-c5ffc512a05d_1914x959.png 424w, https://substackcdn.com/image/fetch/$s_!-xuP!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9e44a3dc-c03b-4f39-bf6d-c5ffc512a05d_1914x959.png 848w, https://substackcdn.com/image/fetch/$s_!-xuP!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9e44a3dc-c03b-4f39-bf6d-c5ffc512a05d_1914x959.png 1272w, 
https://substackcdn.com/image/fetch/$s_!-xuP!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9e44a3dc-c03b-4f39-bf6d-c5ffc512a05d_1914x959.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!-xuP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9e44a3dc-c03b-4f39-bf6d-c5ffc512a05d_1914x959.png" width="1456" height="730" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/9e44a3dc-c03b-4f39-bf6d-c5ffc512a05d_1914x959.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:730,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:95640,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9e44a3dc-c03b-4f39-bf6d-c5ffc512a05d_1914x959.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!-xuP!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9e44a3dc-c03b-4f39-bf6d-c5ffc512a05d_1914x959.png 424w, https://substackcdn.com/image/fetch/$s_!-xuP!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9e44a3dc-c03b-4f39-bf6d-c5ffc512a05d_1914x959.png 848w, 
https://substackcdn.com/image/fetch/$s_!-xuP!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9e44a3dc-c03b-4f39-bf6d-c5ffc512a05d_1914x959.png 1272w, https://substackcdn.com/image/fetch/$s_!-xuP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9e44a3dc-c03b-4f39-bf6d-c5ffc512a05d_1914x959.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>You can even see this article has 15 chunks in total and the text that makes up chunk 9. 
</p><p>The &#8220;id&#8221; field is actually a combination of the article DOI followed by _&lt;chunknumber&gt;, which allows the LLM to combine chunks across the same article when needed.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!sjSJ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc59539a9-ab8e-4c74-9818-764176cc929b_583x609.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!sjSJ!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc59539a9-ab8e-4c74-9818-764176cc929b_583x609.png 424w, https://substackcdn.com/image/fetch/$s_!sjSJ!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc59539a9-ab8e-4c74-9818-764176cc929b_583x609.png 848w, https://substackcdn.com/image/fetch/$s_!sjSJ!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc59539a9-ab8e-4c74-9818-764176cc929b_583x609.png 1272w, https://substackcdn.com/image/fetch/$s_!sjSJ!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc59539a9-ab8e-4c74-9818-764176cc929b_583x609.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!sjSJ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc59539a9-ab8e-4c74-9818-764176cc929b_583x609.png" width="583" height="609" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c59539a9-ab8e-4c74-9818-764176cc929b_583x609.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:609,&quot;width&quot;:583,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:49432,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc59539a9-ab8e-4c74-9818-764176cc929b_583x609.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!sjSJ!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc59539a9-ab8e-4c74-9818-764176cc929b_583x609.png 424w, https://substackcdn.com/image/fetch/$s_!sjSJ!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc59539a9-ab8e-4c74-9818-764176cc929b_583x609.png 848w, https://substackcdn.com/image/fetch/$s_!sjSJ!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc59539a9-ab8e-4c74-9818-764176cc929b_583x609.png 1272w, https://substackcdn.com/image/fetch/$s_!sjSJ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc59539a9-ab8e-4c74-9818-764176cc929b_583x609.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Finally you can even see the final relevance score after reranking for each chunk &#8220;rerank_score&#8221;. </p><p>&#8220;rrf_score&#8221; probably stands for <a href="https://medium.com/@devalshah1619/mathematical-intuition-behind-reciprocal-rank-fusion-rrf-explained-in-2-mins-002df0cc5e2a">Reciprocal Rank Fusion</a>, which is a way to calculate a combined rank based on multiple ranking scores. 
For example, a system which gives a separate score/ranking using BM25 and dense embeddings can use RRF to combine the two to get a &#8220;fused&#8221;/combined rank.</p><blockquote><p>The &#8220;rrf_score&#8221; currently shows zero all the time because the system is just doing &#8220;Semantic search&#8221;, though hybrid search might be coming.</p></blockquote><p>From there, Claude will use the 20 retrieved chunks to try to answer my question, much like how RAG (retrieval-augmented generation) works.</p><h2>Preliminary Observations of the Wiley AI Gateway </h2><p>I spent considerable time exploring how inputs get translated into search queries. You&#8217;ll quickly discover that there are queries it can&#8217;t handle&#8212;either because the LLM translates them strangely or because the MCP server lacks certain capabilities.</p><p>For example, <a href="https://claude.ai/share/7d99a185-73cc-413f-b7ae-69007ee1b134">I asked it to look up a paper and show references from a certain year, but it reported it couldn&#8217;t access references via the MCP server</a>. Another example: inspired by <a href="https://arxiv.org/abs/2510.22242">recent research</a>, I found it <a href="https://claude.ai/share/29cddc9f-3502-4391-8b5b-7961dcd2ca22">generally struggled to find &#8220;the last sentence of a paper&#8221;</a>. You would think that, since the metadata actually states the number of chunks in the article, the last chunk (which usually excludes references) should in theory be identifiable. That said, I suspect this MCP server has no way to request by chunk number. <a href="https://claude.ai/share/7d776443-e5dd-4d4e-808e-4deb3d238b91">Opus 4.5 sometimes figures it out anyway</a>, but a lexical search instead of just a semantic search should easily nail this.</p><p>Requesting figures or tables generally works well.</p><blockquote><p>This highlights an emerging challenge for natural language search interfaces: we lack affordances showing what&#8217;s possible (e.g. 
filters available). With agentic search, the range of possible tasks has expanded so dramatically that users don&#8217;t know what&#8217;s achievable and what isn&#8217;t. E.g., can Claude use the Wiley Connector to look up a paper and find related papers that could have been cited but are not? Answer: with the Wiley Connector, no, because it can&#8217;t easily access the references to check.</p></blockquote><p>Often, turning on the free web search connector solves issues&#8212;if an Open Access copy exists. For example, for the issue of finding the last sentence, or finding references of a certain range, the web search connector might be able to download an open access version of the paper and extract the answer from the whole paper&#8217;s full text, overcoming the limitation of chunk-based retrieval.</p><p>Lots more testing needed!</p><h2>Testing the PubMed MCP Server</h2><p>While exploring the Wiley AI Gateway, I discovered you could also enable a PubMed MCP server. It appears to be one <a href="https://support.claude.com/en/articles/12614801-using-the-pubmed-connector-in-claude">offered by Anthropic</a>, but it is unclear if NLM is involved.</p><blockquote><p>There are of course some risks in using third-party MCP servers (either locally or remotely), since this involves running code in the background. 
But given this one seems officially offered by Anthropic it should be fine.</p></blockquote><p>I used similar settings: extended thinking on, research mode off, web search off, only the PubMed connector enabled.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!kZrm!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92fff0fe-a948-46db-972f-1cd4638f340f_855x510.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!kZrm!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92fff0fe-a948-46db-972f-1cd4638f340f_855x510.png 424w, https://substackcdn.com/image/fetch/$s_!kZrm!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92fff0fe-a948-46db-972f-1cd4638f340f_855x510.png 848w, https://substackcdn.com/image/fetch/$s_!kZrm!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92fff0fe-a948-46db-972f-1cd4638f340f_855x510.png 1272w, https://substackcdn.com/image/fetch/$s_!kZrm!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92fff0fe-a948-46db-972f-1cd4638f340f_855x510.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!kZrm!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92fff0fe-a948-46db-972f-1cd4638f340f_855x510.png" width="855" height="510" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/92fff0fe-a948-46db-972f-1cd4638f340f_855x510.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:510,&quot;width&quot;:855,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:43404,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92fff0fe-a948-46db-972f-1cd4638f340f_855x510.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!kZrm!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92fff0fe-a948-46db-972f-1cd4638f340f_855x510.png 424w, https://substackcdn.com/image/fetch/$s_!kZrm!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92fff0fe-a948-46db-972f-1cd4638f340f_855x510.png 848w, https://substackcdn.com/image/fetch/$s_!kZrm!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92fff0fe-a948-46db-972f-1cd4638f340f_855x510.png 1272w, https://substackcdn.com/image/fetch/$s_!kZrm!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92fff0fe-a948-46db-972f-1cd4638f340f_855x510.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The PubMed MCP server works quite differently from Wiley&#8217;s. 
</p><p>One key difference: it displays the available tools, giving you a clearer idea of capabilities.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!xveQ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe05fb90c-0876-4ecd-9f52-952be48b27dd_611x482.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!xveQ!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe05fb90c-0876-4ecd-9f52-952be48b27dd_611x482.png 424w, https://substackcdn.com/image/fetch/$s_!xveQ!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe05fb90c-0876-4ecd-9f52-952be48b27dd_611x482.png 848w, https://substackcdn.com/image/fetch/$s_!xveQ!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe05fb90c-0876-4ecd-9f52-952be48b27dd_611x482.png 1272w, https://substackcdn.com/image/fetch/$s_!xveQ!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe05fb90c-0876-4ecd-9f52-952be48b27dd_611x482.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!xveQ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe05fb90c-0876-4ecd-9f52-952be48b27dd_611x482.png" width="611" height="482" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/e05fb90c-0876-4ecd-9f52-952be48b27dd_611x482.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:482,&quot;width&quot;:611,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:32992,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe05fb90c-0876-4ecd-9f52-952be48b27dd_611x482.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!xveQ!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe05fb90c-0876-4ecd-9f52-952be48b27dd_611x482.png 424w, https://substackcdn.com/image/fetch/$s_!xveQ!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe05fb90c-0876-4ecd-9f52-952be48b27dd_611x482.png 848w, https://substackcdn.com/image/fetch/$s_!xveQ!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe05fb90c-0876-4ecd-9f52-952be48b27dd_611x482.png 1272w, https://substackcdn.com/image/fetch/$s_!xveQ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe05fb90c-0876-4ecd-9f52-952be48b27dd_611x482.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Secondly, as you will see later, it actually uses the default PubMed search to retrieve results, after which it can retrieve the complete full text (not chunks) via PMC.</p><p>The document suggests the PubMed connector is quite capable of searching for &#8220;most cited papers&#8221; - though when I tested, Claude claimed &#8220;PubMed doesn&#8217;t directly provide citation counts in its search results&#8221;. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!8P8z!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06a83876-0a3f-4f26-86f7-e8768a83eaf5_1131x699.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!8P8z!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06a83876-0a3f-4f26-86f7-e8768a83eaf5_1131x699.png 424w, https://substackcdn.com/image/fetch/$s_!8P8z!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06a83876-0a3f-4f26-86f7-e8768a83eaf5_1131x699.png 848w, https://substackcdn.com/image/fetch/$s_!8P8z!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06a83876-0a3f-4f26-86f7-e8768a83eaf5_1131x699.png 1272w, https://substackcdn.com/image/fetch/$s_!8P8z!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06a83876-0a3f-4f26-86f7-e8768a83eaf5_1131x699.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!8P8z!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06a83876-0a3f-4f26-86f7-e8768a83eaf5_1131x699.png" width="1131" height="699" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/06a83876-0a3f-4f26-86f7-e8768a83eaf5_1131x699.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:699,&quot;width&quot;:1131,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:86018,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06a83876-0a3f-4f26-86f7-e8768a83eaf5_1131x699.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!8P8z!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06a83876-0a3f-4f26-86f7-e8768a83eaf5_1131x699.png 424w, https://substackcdn.com/image/fetch/$s_!8P8z!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06a83876-0a3f-4f26-86f7-e8768a83eaf5_1131x699.png 848w, https://substackcdn.com/image/fetch/$s_!8P8z!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06a83876-0a3f-4f26-86f7-e8768a83eaf5_1131x699.png 1272w, https://substackcdn.com/image/fetch/$s_!8P8z!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F06a83876-0a3f-4f26-86f7-e8768a83eaf5_1131x699.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Lots of testing needed to see what this connector is capable of but for my <a href="https://claude.ai/share/429e6ace-40b3-4362-8163-4233c2ee079a">first test searching for papers on impact of exercise on cancer</a>, Claude was somewhat lazy&#8212;it went with the simplest possible query:</p><p> </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!ySll!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F251eeb0c-9082-498c-9c2b-721bc3cff4ca_679x305.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" 
srcset="https://substackcdn.com/image/fetch/$s_!ySll!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F251eeb0c-9082-498c-9c2b-721bc3cff4ca_679x305.png 424w, https://substackcdn.com/image/fetch/$s_!ySll!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F251eeb0c-9082-498c-9c2b-721bc3cff4ca_679x305.png 848w, https://substackcdn.com/image/fetch/$s_!ySll!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F251eeb0c-9082-498c-9c2b-721bc3cff4ca_679x305.png 1272w, https://substackcdn.com/image/fetch/$s_!ySll!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F251eeb0c-9082-498c-9c2b-721bc3cff4ca_679x305.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!ySll!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F251eeb0c-9082-498c-9c2b-721bc3cff4ca_679x305.png" width="679" height="305" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/251eeb0c-9082-498c-9c2b-721bc3cff4ca_679x305.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:305,&quot;width&quot;:679,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:33436,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F251eeb0c-9082-498c-9c2b-721bc3cff4ca_679x305.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!ySll!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F251eeb0c-9082-498c-9c2b-721bc3cff4ca_679x305.png 424w, https://substackcdn.com/image/fetch/$s_!ySll!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F251eeb0c-9082-498c-9c2b-721bc3cff4ca_679x305.png 848w, https://substackcdn.com/image/fetch/$s_!ySll!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F251eeb0c-9082-498c-9c2b-721bc3cff4ca_679x305.png 1272w, https://substackcdn.com/image/fetch/$s_!ySll!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F251eeb0c-9082-498c-9c2b-721bc3cff4ca_679x305.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" 
stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>As you can see from the JSON request below, it literally did the equivalent of entering the following into PubMed:</p><p><code>exercise cancer </code></p><p>and retrieved the top 15 results by PMID</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!de1X!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1cce0f13-4c6c-4959-9906-244dfbd09bfc_589x248.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!de1X!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1cce0f13-4c6c-4959-9906-244dfbd09bfc_589x248.png 424w, https://substackcdn.com/image/fetch/$s_!de1X!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1cce0f13-4c6c-4959-9906-244dfbd09bfc_589x248.png 848w, https://substackcdn.com/image/fetch/$s_!de1X!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1cce0f13-4c6c-4959-9906-244dfbd09bfc_589x248.png 1272w, https://substackcdn.com/image/fetch/$s_!de1X!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1cce0f13-4c6c-4959-9906-244dfbd09bfc_589x248.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!de1X!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1cce0f13-4c6c-4959-9906-244dfbd09bfc_589x248.png" width="589" height="248" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/1cce0f13-4c6c-4959-9906-244dfbd09bfc_589x248.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:248,&quot;width&quot;:589,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:11476,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1cce0f13-4c6c-4959-9906-244dfbd09bfc_589x248.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!de1X!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1cce0f13-4c6c-4959-9906-244dfbd09bfc_589x248.png 424w, https://substackcdn.com/image/fetch/$s_!de1X!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1cce0f13-4c6c-4959-9906-244dfbd09bfc_589x248.png 848w, https://substackcdn.com/image/fetch/$s_!de1X!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1cce0f13-4c6c-4959-9906-244dfbd09bfc_589x248.png 1272w, https://substackcdn.com/image/fetch/$s_!de1X!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1cce0f13-4c6c-4959-9906-244dfbd09bfc_589x248.png 1456w" sizes="100vw" 
loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This is the response.</p><p>It retrieved the top 15 results by PMID (see screencap below),</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!cpsE!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fac56bf31-003f-454e-a6fd-6f98ad99c383_785x301.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" 
srcset="https://substackcdn.com/image/fetch/$s_!cpsE!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fac56bf31-003f-454e-a6fd-6f98ad99c383_785x301.png 424w, https://substackcdn.com/image/fetch/$s_!cpsE!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fac56bf31-003f-454e-a6fd-6f98ad99c383_785x301.png 848w, https://substackcdn.com/image/fetch/$s_!cpsE!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fac56bf31-003f-454e-a6fd-6f98ad99c383_785x301.png 1272w, https://substackcdn.com/image/fetch/$s_!cpsE!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fac56bf31-003f-454e-a6fd-6f98ad99c383_785x301.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!cpsE!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fac56bf31-003f-454e-a6fd-6f98ad99c383_785x301.png" width="785" height="301" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ac56bf31-003f-454e-a6fd-6f98ad99c383_785x301.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:301,&quot;width&quot;:785,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:16182,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fac56bf31-003f-454e-a6fd-6f98ad99c383_785x301.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!cpsE!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fac56bf31-003f-454e-a6fd-6f98ad99c383_785x301.png 424w, https://substackcdn.com/image/fetch/$s_!cpsE!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fac56bf31-003f-454e-a6fd-6f98ad99c383_785x301.png 848w, https://substackcdn.com/image/fetch/$s_!cpsE!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fac56bf31-003f-454e-a6fd-6f98ad99c383_785x301.png 1272w, https://substackcdn.com/image/fetch/$s_!cpsE!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fac56bf31-003f-454e-a6fd-6f98ad99c383_785x301.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" 
stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>plus the total number of hits and query translation (presumably via Auto Term Mapping).  </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!q4re!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70f6c34b-9566-43be-a1d1-05a74c924532_643x257.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!q4re!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70f6c34b-9566-43be-a1d1-05a74c924532_643x257.png 424w, https://substackcdn.com/image/fetch/$s_!q4re!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70f6c34b-9566-43be-a1d1-05a74c924532_643x257.png 848w, https://substackcdn.com/image/fetch/$s_!q4re!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70f6c34b-9566-43be-a1d1-05a74c924532_643x257.png 1272w, https://substackcdn.com/image/fetch/$s_!q4re!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70f6c34b-9566-43be-a1d1-05a74c924532_643x257.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!q4re!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70f6c34b-9566-43be-a1d1-05a74c924532_643x257.png" width="643" height="257" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/70f6c34b-9566-43be-a1d1-05a74c924532_643x257.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:257,&quot;width&quot;:643,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:44838,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70f6c34b-9566-43be-a1d1-05a74c924532_643x257.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!q4re!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70f6c34b-9566-43be-a1d1-05a74c924532_643x257.png 424w, https://substackcdn.com/image/fetch/$s_!q4re!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70f6c34b-9566-43be-a1d1-05a74c924532_643x257.png 848w, https://substackcdn.com/image/fetch/$s_!q4re!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70f6c34b-9566-43be-a1d1-05a74c924532_643x257.png 1272w, https://substackcdn.com/image/fetch/$s_!q4re!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70f6c34b-9566-43be-a1d1-05a74c924532_643x257.png 1456w" sizes="100vw" 
loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>I confirmed this was working as expected by running the same query through PubMed&#8217;s web interface: I got 35,718 hits (one more than the MCP server for some odd reason). 
The top 15 PMIDs matched what I got sorting by &#8220;Best match&#8221; in this case, though I have seen it query with &#8220;most recent&#8221; sorting in some cases as well.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!7fx8!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffd0d6699-66ce-4b78-86af-ab794d7193ef_851x810.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!7fx8!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffd0d6699-66ce-4b78-86af-ab794d7193ef_851x810.png 424w, https://substackcdn.com/image/fetch/$s_!7fx8!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffd0d6699-66ce-4b78-86af-ab794d7193ef_851x810.png 848w, https://substackcdn.com/image/fetch/$s_!7fx8!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffd0d6699-66ce-4b78-86af-ab794d7193ef_851x810.png 1272w, https://substackcdn.com/image/fetch/$s_!7fx8!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffd0d6699-66ce-4b78-86af-ab794d7193ef_851x810.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!7fx8!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffd0d6699-66ce-4b78-86af-ab794d7193ef_851x810.png" width="851" height="810" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/fd0d6699-66ce-4b78-86af-ab794d7193ef_851x810.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:810,&quot;width&quot;:851,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:91069,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffd0d6699-66ce-4b78-86af-ab794d7193ef_851x810.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!7fx8!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffd0d6699-66ce-4b78-86af-ab794d7193ef_851x810.png 424w, https://substackcdn.com/image/fetch/$s_!7fx8!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffd0d6699-66ce-4b78-86af-ab794d7193ef_851x810.png 848w, https://substackcdn.com/image/fetch/$s_!7fx8!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffd0d6699-66ce-4b78-86af-ab794d7193ef_851x810.png 1272w, https://substackcdn.com/image/fetch/$s_!7fx8!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffd0d6699-66ce-4b78-86af-ab794d7193ef_851x810.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Claude then used those 15 PMIDs to request article metadata (title, abstract, etc.) 
and generated an answer from there.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Todi!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6adec07-2a20-4849-af45-dad2e8faebfb_652x309.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Todi!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6adec07-2a20-4849-af45-dad2e8faebfb_652x309.png 424w, https://substackcdn.com/image/fetch/$s_!Todi!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6adec07-2a20-4849-af45-dad2e8faebfb_652x309.png 848w, https://substackcdn.com/image/fetch/$s_!Todi!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6adec07-2a20-4849-af45-dad2e8faebfb_652x309.png 1272w, https://substackcdn.com/image/fetch/$s_!Todi!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6adec07-2a20-4849-af45-dad2e8faebfb_652x309.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Todi!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6adec07-2a20-4849-af45-dad2e8faebfb_652x309.png" width="652" height="309" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c6adec07-2a20-4849-af45-dad2e8faebfb_652x309.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:309,&quot;width&quot;:652,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:17068,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6adec07-2a20-4849-af45-dad2e8faebfb_652x309.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Todi!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6adec07-2a20-4849-af45-dad2e8faebfb_652x309.png 424w, https://substackcdn.com/image/fetch/$s_!Todi!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6adec07-2a20-4849-af45-dad2e8faebfb_652x309.png 848w, https://substackcdn.com/image/fetch/$s_!Todi!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6adec07-2a20-4849-af45-dad2e8faebfb_652x309.png 1272w, https://substackcdn.com/image/fetch/$s_!Todi!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6adec07-2a20-4849-af45-dad2e8faebfb_652x309.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This part of the response</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!9uWX!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbad54e35-0baa-4456-bfa6-1b1914750a04_655x251.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!9uWX!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbad54e35-0baa-4456-bfa6-1b1914750a04_655x251.png 424w, 
https://substackcdn.com/image/fetch/$s_!9uWX!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbad54e35-0baa-4456-bfa6-1b1914750a04_655x251.png 848w, https://substackcdn.com/image/fetch/$s_!9uWX!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbad54e35-0baa-4456-bfa6-1b1914750a04_655x251.png 1272w, https://substackcdn.com/image/fetch/$s_!9uWX!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbad54e35-0baa-4456-bfa6-1b1914750a04_655x251.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!9uWX!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbad54e35-0baa-4456-bfa6-1b1914750a04_655x251.png" width="655" height="251" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/bad54e35-0baa-4456-bfa6-1b1914750a04_655x251.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:251,&quot;width&quot;:655,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:24263,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbad54e35-0baa-4456-bfa6-1b1914750a04_655x251.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!9uWX!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbad54e35-0baa-4456-bfa6-1b1914750a04_655x251.png 424w, 
https://substackcdn.com/image/fetch/$s_!9uWX!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbad54e35-0baa-4456-bfa6-1b1914750a04_655x251.png 848w, https://substackcdn.com/image/fetch/$s_!9uWX!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbad54e35-0baa-4456-bfa6-1b1914750a04_655x251.png 1272w, https://substackcdn.com/image/fetch/$s_!9uWX!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbad54e35-0baa-4456-bfa6-1b1914750a04_655x251.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>So from there it uses the metadata including title and abstract to generate an answer.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!y35g!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6c4e923-36b8-48f5-8f8f-c4e8355e267f_672x584.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!y35g!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6c4e923-36b8-48f5-8f8f-c4e8355e267f_672x584.png 424w, https://substackcdn.com/image/fetch/$s_!y35g!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6c4e923-36b8-48f5-8f8f-c4e8355e267f_672x584.png 848w, https://substackcdn.com/image/fetch/$s_!y35g!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6c4e923-36b8-48f5-8f8f-c4e8355e267f_672x584.png 1272w, https://substackcdn.com/image/fetch/$s_!y35g!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6c4e923-36b8-48f5-8f8f-c4e8355e267f_672x584.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!y35g!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6c4e923-36b8-48f5-8f8f-c4e8355e267f_672x584.png" width="672" height="584" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c6c4e923-36b8-48f5-8f8f-c4e8355e267f_672x584.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:584,&quot;width&quot;:672,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:91516,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6c4e923-36b8-48f5-8f8f-c4e8355e267f_672x584.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!y35g!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6c4e923-36b8-48f5-8f8f-c4e8355e267f_672x584.png 424w, https://substackcdn.com/image/fetch/$s_!y35g!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6c4e923-36b8-48f5-8f8f-c4e8355e267f_672x584.png 848w, https://substackcdn.com/image/fetch/$s_!y35g!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6c4e923-36b8-48f5-8f8f-c4e8355e267f_672x584.png 1272w, https://substackcdn.com/image/fetch/$s_!y35g!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc6c4e923-36b8-48f5-8f8f-c4e8355e267f_672x584.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2>Retrieving full text vs text chunks</h2><p>As you can see from the tool list, this PubMed MCP server can also retrieve full text, but only when you feed it PMIDs. 
Unlike the Wiley AI Gateway server (where you can get only chunks of text) you get the whole paper&#8217;s full-text (if available in PMC) in the response and not just chunks.</p><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!EweF!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70ebacaa-470e-4b93-887e-cab1cc5ac63f_578x175.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!EweF!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70ebacaa-470e-4b93-887e-cab1cc5ac63f_578x175.png 424w, https://substackcdn.com/image/fetch/$s_!EweF!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70ebacaa-470e-4b93-887e-cab1cc5ac63f_578x175.png 848w, https://substackcdn.com/image/fetch/$s_!EweF!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70ebacaa-470e-4b93-887e-cab1cc5ac63f_578x175.png 1272w, https://substackcdn.com/image/fetch/$s_!EweF!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70ebacaa-470e-4b93-887e-cab1cc5ac63f_578x175.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!EweF!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70ebacaa-470e-4b93-887e-cab1cc5ac63f_578x175.png" width="578" height="175" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/70ebacaa-470e-4b93-887e-cab1cc5ac63f_578x175.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:175,&quot;width&quot;:578,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:6494,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70ebacaa-470e-4b93-887e-cab1cc5ac63f_578x175.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!EweF!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70ebacaa-470e-4b93-887e-cab1cc5ac63f_578x175.png 424w, https://substackcdn.com/image/fetch/$s_!EweF!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70ebacaa-470e-4b93-887e-cab1cc5ac63f_578x175.png 848w, https://substackcdn.com/image/fetch/$s_!EweF!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70ebacaa-470e-4b93-887e-cab1cc5ac63f_578x175.png 1272w, https://substackcdn.com/image/fetch/$s_!EweF!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F70ebacaa-470e-4b93-887e-cab1cc5ac63f_578x175.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p>This is why it can more easily answer questions like &#8220;<a href="https://claude.ai/share/8cd79c4d-2dfe-4ca5-91bd-89e63e60c419">find me the last sentence of The state of OA: a large-scale 
analysis of the prevalence and impact of Open Access articles</a>&#8221;</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!DkB5!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92f1353c-ebd0-4edf-8aed-a23c2a31b11a_578x482.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!DkB5!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92f1353c-ebd0-4edf-8aed-a23c2a31b11a_578x482.png 424w, https://substackcdn.com/image/fetch/$s_!DkB5!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92f1353c-ebd0-4edf-8aed-a23c2a31b11a_578x482.png 848w, https://substackcdn.com/image/fetch/$s_!DkB5!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92f1353c-ebd0-4edf-8aed-a23c2a31b11a_578x482.png 1272w, https://substackcdn.com/image/fetch/$s_!DkB5!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92f1353c-ebd0-4edf-8aed-a23c2a31b11a_578x482.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!DkB5!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92f1353c-ebd0-4edf-8aed-a23c2a31b11a_578x482.png" width="578" height="482" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/92f1353c-ebd0-4edf-8aed-a23c2a31b11a_578x482.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:482,&quot;width&quot;:578,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:62536,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92f1353c-ebd0-4edf-8aed-a23c2a31b11a_578x482.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!DkB5!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92f1353c-ebd0-4edf-8aed-a23c2a31b11a_578x482.png 424w, https://substackcdn.com/image/fetch/$s_!DkB5!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92f1353c-ebd0-4edf-8aed-a23c2a31b11a_578x482.png 848w, https://substackcdn.com/image/fetch/$s_!DkB5!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92f1353c-ebd0-4edf-8aed-a23c2a31b11a_578x482.png 1272w, https://substackcdn.com/image/fetch/$s_!DkB5!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F92f1353c-ebd0-4edf-8aed-a23c2a31b11a_578x482.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>However, like Wiley, the full text here doesn&#8217;t include references, and the metadata lacks them entirely. Questions like &#8220;<a href="https://claude.ai/share/16f85b86-f601-4a85-a10c-656d35a51793">find me papers referenced by X from 2016&#8211;2017</a>&#8221; remain tricky&#8212;though since you can get full text via PMC, the LLM can potentially download and use inline references to attempt an answer. 
</p><p>In comparison, the Wiley AI Gateway gives you only chunks.</p><h2>A Game-Changer: LLMs Can Now Pilot-Test Boolean Search Strategies</h2><p>Since ChatGPT launched, evidence synthesis researchers have explored two main applications: <a href="https://app.undermind.ai/report/b65b2b0710729959bcc0a6006463c898298622b01b60d5dc7e3a592205e110c5">using LLMs as screeners</a> (promising but uneven results) and using them to <a href="https://app.undermind.ai/report/8f6940b18b8a7c8bbf5ee1b080dde713fe492b976f0be4c8ebfaa15235e42a24">generate Boolean search strings</a> (<a href="https://app.undermind.ai/report/8f6940b18b8a7c8bbf5ee1b080dde713fe492b976f0be4c8ebfaa15235e42a24">largely unsuccessful</a>).</p><p>Studies pitting librarians against ChatGPT on generating Boolean search queries, <a href="https://journals.sagepub.com/doi/10.1177/03400352241263532">such as this one</a>, consistently showed humans generating strategies with far better recall, while LLMs tended toward higher precision but lower recall. More recent studies tried different prompting strategies and even fine-tuning&#8212;with no greater success.</p><p>I always felt these comparisons were unfair. Human searchers can look things up, check the MeSH browser, and pilot-test different strategies. LLMs could not.</p><p>Until now&#8212;via the PubMed MCP server.</p><blockquote><p>Note: The PubMed MCP server seems to have a bug that causes it to fail on queries that are too long, forcing the LLM to test simpler versions. 
I&#8217;ll ignore this issue for now.</p></blockquote><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!2z4V!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F027689fb-ea0a-40fb-98cd-c5c6a51409eb_1296x512.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!2z4V!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F027689fb-ea0a-40fb-98cd-c5c6a51409eb_1296x512.png 424w, https://substackcdn.com/image/fetch/$s_!2z4V!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F027689fb-ea0a-40fb-98cd-c5c6a51409eb_1296x512.png 848w, https://substackcdn.com/image/fetch/$s_!2z4V!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F027689fb-ea0a-40fb-98cd-c5c6a51409eb_1296x512.png 1272w, https://substackcdn.com/image/fetch/$s_!2z4V!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F027689fb-ea0a-40fb-98cd-c5c6a51409eb_1296x512.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!2z4V!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F027689fb-ea0a-40fb-98cd-c5c6a51409eb_1296x512.png" width="1296" height="512" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/027689fb-ea0a-40fb-98cd-c5c6a51409eb_1296x512.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:512,&quot;width&quot;:1296,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:54185,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F027689fb-ea0a-40fb-98cd-c5c6a51409eb_1296x512.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!2z4V!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F027689fb-ea0a-40fb-98cd-c5c6a51409eb_1296x512.png 424w, https://substackcdn.com/image/fetch/$s_!2z4V!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F027689fb-ea0a-40fb-98cd-c5c6a51409eb_1296x512.png 848w, https://substackcdn.com/image/fetch/$s_!2z4V!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F027689fb-ea0a-40fb-98cd-c5c6a51409eb_1296x512.png 1272w, https://substackcdn.com/image/fetch/$s_!2z4V!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F027689fb-ea0a-40fb-98cd-c5c6a51409eb_1296x512.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p></p><h2>Example: Evaluating a Boolean Search Strategy</h2><p>When I asked Claude to evaluate a Boolean search strategy, it:</p><ul><li><p>Identified the main concept blocks</p></li></ul><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!GGhN!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b5dae61-7d64-4502-9ddb-d0b097efa56f_596x378.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!GGhN!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b5dae61-7d64-4502-9ddb-d0b097efa56f_596x378.png 424w, 
https://substackcdn.com/image/fetch/$s_!GGhN!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b5dae61-7d64-4502-9ddb-d0b097efa56f_596x378.png 848w, https://substackcdn.com/image/fetch/$s_!GGhN!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b5dae61-7d64-4502-9ddb-d0b097efa56f_596x378.png 1272w, https://substackcdn.com/image/fetch/$s_!GGhN!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b5dae61-7d64-4502-9ddb-d0b097efa56f_596x378.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!GGhN!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b5dae61-7d64-4502-9ddb-d0b097efa56f_596x378.png" width="596" height="378" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/2b5dae61-7d64-4502-9ddb-d0b097efa56f_596x378.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:378,&quot;width&quot;:596,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:48915,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b5dae61-7d64-4502-9ddb-d0b097efa56f_596x378.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!GGhN!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b5dae61-7d64-4502-9ddb-d0b097efa56f_596x378.png 424w, 
https://substackcdn.com/image/fetch/$s_!GGhN!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b5dae61-7d64-4502-9ddb-d0b097efa56f_596x378.png 848w, https://substackcdn.com/image/fetch/$s_!GGhN!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b5dae61-7d64-4502-9ddb-d0b097efa56f_596x378.png 1272w, https://substackcdn.com/image/fetch/$s_!GGhN!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2b5dae61-7d64-4502-9ddb-d0b097efa56f_596x378.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><ul><li><p>Ran the search to grab top-ranked 5 items by PMID and retrieve their metadata</p><p> </p></li></ul><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!mn0Z!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc130c453-6a2f-441d-b31f-20aefce76947_621x643.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!mn0Z!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc130c453-6a2f-441d-b31f-20aefce76947_621x643.png 424w, https://substackcdn.com/image/fetch/$s_!mn0Z!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc130c453-6a2f-441d-b31f-20aefce76947_621x643.png 848w, https://substackcdn.com/image/fetch/$s_!mn0Z!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc130c453-6a2f-441d-b31f-20aefce76947_621x643.png 1272w, https://substackcdn.com/image/fetch/$s_!mn0Z!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc130c453-6a2f-441d-b31f-20aefce76947_621x643.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!mn0Z!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc130c453-6a2f-441d-b31f-20aefce76947_621x643.png" width="621" height="643" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c130c453-6a2f-441d-b31f-20aefce76947_621x643.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:643,&quot;width&quot;:621,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:52943,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc130c453-6a2f-441d-b31f-20aefce76947_621x643.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!mn0Z!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc130c453-6a2f-441d-b31f-20aefce76947_621x643.png 424w, https://substackcdn.com/image/fetch/$s_!mn0Z!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc130c453-6a2f-441d-b31f-20aefce76947_621x643.png 848w, https://substackcdn.com/image/fetch/$s_!mn0Z!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc130c453-6a2f-441d-b31f-20aefce76947_621x643.png 1272w, https://substackcdn.com/image/fetch/$s_!mn0Z!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc130c453-6a2f-441d-b31f-20aefce76947_621x643.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><ul><li><p>Then it &#8220;notices&#8221; something</p></li></ul><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!9BfS!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf26e863-4623-46d2-860d-f7e5c587c96d_551x189.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!9BfS!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf26e863-4623-46d2-860d-f7e5c587c96d_551x189.png 424w, 
https://substackcdn.com/image/fetch/$s_!9BfS!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf26e863-4623-46d2-860d-f7e5c587c96d_551x189.png 848w, https://substackcdn.com/image/fetch/$s_!9BfS!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf26e863-4623-46d2-860d-f7e5c587c96d_551x189.png 1272w, https://substackcdn.com/image/fetch/$s_!9BfS!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf26e863-4623-46d2-860d-f7e5c587c96d_551x189.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!9BfS!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf26e863-4623-46d2-860d-f7e5c587c96d_551x189.png" width="551" height="189" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/df26e863-4623-46d2-860d-f7e5c587c96d_551x189.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:189,&quot;width&quot;:551,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:23955,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf26e863-4623-46d2-860d-f7e5c587c96d_551x189.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!9BfS!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf26e863-4623-46d2-860d-f7e5c587c96d_551x189.png 424w, 
https://substackcdn.com/image/fetch/$s_!9BfS!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf26e863-4623-46d2-860d-f7e5c587c96d_551x189.png 848w, https://substackcdn.com/image/fetch/$s_!9BfS!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf26e863-4623-46d2-860d-f7e5c587c96d_551x189.png 1272w, https://substackcdn.com/image/fetch/$s_!9BfS!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf26e863-4623-46d2-860d-f7e5c587c96d_551x189.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><ul><li><p>It decided to check whether MeSH headings existed and &#8220;wondered&#8221; whether to drop the outcome block (conventional wisdom in many cases)</p></li></ul><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!mOk4!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8b234291-11b5-4061-86b1-6f814f656d0a_503x96.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!mOk4!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8b234291-11b5-4061-86b1-6f814f656d0a_503x96.png 424w, https://substackcdn.com/image/fetch/$s_!mOk4!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8b234291-11b5-4061-86b1-6f814f656d0a_503x96.png 848w, 
https://substackcdn.com/image/fetch/$s_!mOk4!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8b234291-11b5-4061-86b1-6f814f656d0a_503x96.png 1272w, https://substackcdn.com/image/fetch/$s_!mOk4!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8b234291-11b5-4061-86b1-6f814f656d0a_503x96.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!mOk4!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8b234291-11b5-4061-86b1-6f814f656d0a_503x96.png" width="503" height="96" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/8b234291-11b5-4061-86b1-6f814f656d0a_503x96.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:96,&quot;width&quot;:503,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:14515,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8b234291-11b5-4061-86b1-6f814f656d0a_503x96.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!mOk4!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8b234291-11b5-4061-86b1-6f814f656d0a_503x96.png 424w, https://substackcdn.com/image/fetch/$s_!mOk4!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8b234291-11b5-4061-86b1-6f814f656d0a_503x96.png 848w, 
https://substackcdn.com/image/fetch/$s_!mOk4!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8b234291-11b5-4061-86b1-6f814f656d0a_503x96.png 1272w, https://substackcdn.com/image/fetch/$s_!mOk4!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8b234291-11b5-4061-86b1-6f814f656d0a_503x96.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p>I won&#8217;t screencap every step, but here&#8217;s what it concluded.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!9eOc!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb83b954a-5beb-489f-ba32-9f4e4ab29c65_489x629.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!9eOc!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb83b954a-5beb-489f-ba32-9f4e4ab29c65_489x629.png 424w, https://substackcdn.com/image/fetch/$s_!9eOc!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb83b954a-5beb-489f-ba32-9f4e4ab29c65_489x629.png 848w, https://substackcdn.com/image/fetch/$s_!9eOc!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb83b954a-5beb-489f-ba32-9f4e4ab29c65_489x629.png 1272w, https://substackcdn.com/image/fetch/$s_!9eOc!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb83b954a-5beb-489f-ba32-9f4e4ab29c65_489x629.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!9eOc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb83b954a-5beb-489f-ba32-9f4e4ab29c65_489x629.png" width="489" height="629" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/b83b954a-5beb-489f-ba32-9f4e4ab29c65_489x629.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:629,&quot;width&quot;:489,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:64334,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb83b954a-5beb-489f-ba32-9f4e4ab29c65_489x629.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!9eOc!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb83b954a-5beb-489f-ba32-9f4e4ab29c65_489x629.png 424w, https://substackcdn.com/image/fetch/$s_!9eOc!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb83b954a-5beb-489f-ba32-9f4e4ab29c65_489x629.png 848w, https://substackcdn.com/image/fetch/$s_!9eOc!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb83b954a-5beb-489f-ba32-9f4e4ab29c65_489x629.png 1272w, https://substackcdn.com/image/fetch/$s_!9eOc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb83b954a-5beb-489f-ba32-9f4e4ab29c65_489x629.png 1456w" sizes="100vw" 
loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Evidence synthesis experts might critique the specific choices of what to test and judgments made while thinking, but that misses the point: <em>it is now capable of testing search strategies in PubMed!</em></p><p>In another run, it assessed precision by trying to find landmark papers and checking if the search retrieved them. For this, I will not screencap the JSON output and just show some highlights. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!7HqM!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ae0d106-33c2-4397-bcaa-a4b2dee60a67_474x385.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!7HqM!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ae0d106-33c2-4397-bcaa-a4b2dee60a67_474x385.png 424w, https://substackcdn.com/image/fetch/$s_!7HqM!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ae0d106-33c2-4397-bcaa-a4b2dee60a67_474x385.png 848w, https://substackcdn.com/image/fetch/$s_!7HqM!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ae0d106-33c2-4397-bcaa-a4b2dee60a67_474x385.png 1272w, https://substackcdn.com/image/fetch/$s_!7HqM!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ae0d106-33c2-4397-bcaa-a4b2dee60a67_474x385.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!7HqM!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ae0d106-33c2-4397-bcaa-a4b2dee60a67_474x385.png" width="474" height="385" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/1ae0d106-33c2-4397-bcaa-a4b2dee60a67_474x385.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:385,&quot;width&quot;:474,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:38333,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ae0d106-33c2-4397-bcaa-a4b2dee60a67_474x385.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!7HqM!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ae0d106-33c2-4397-bcaa-a4b2dee60a67_474x385.png 424w, https://substackcdn.com/image/fetch/$s_!7HqM!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ae0d106-33c2-4397-bcaa-a4b2dee60a67_474x385.png 848w, https://substackcdn.com/image/fetch/$s_!7HqM!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ae0d106-33c2-4397-bcaa-a4b2dee60a67_474x385.png 1272w, https://substackcdn.com/image/fetch/$s_!7HqM!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ae0d106-33c2-4397-bcaa-a4b2dee60a67_474x385.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>After testing it gives this</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!bfeb!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13176bb0-2c90-4be9-88cf-fd13d49c1743_512x392.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!bfeb!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13176bb0-2c90-4be9-88cf-fd13d49c1743_512x392.png 424w, 
https://substackcdn.com/image/fetch/$s_!bfeb!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13176bb0-2c90-4be9-88cf-fd13d49c1743_512x392.png 848w, https://substackcdn.com/image/fetch/$s_!bfeb!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13176bb0-2c90-4be9-88cf-fd13d49c1743_512x392.png 1272w, https://substackcdn.com/image/fetch/$s_!bfeb!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13176bb0-2c90-4be9-88cf-fd13d49c1743_512x392.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!bfeb!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13176bb0-2c90-4be9-88cf-fd13d49c1743_512x392.png" width="512" height="392" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/13176bb0-2c90-4be9-88cf-fd13d49c1743_512x392.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:392,&quot;width&quot;:512,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:42240,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13176bb0-2c90-4be9-88cf-fd13d49c1743_512x392.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!bfeb!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13176bb0-2c90-4be9-88cf-fd13d49c1743_512x392.png 424w, 
https://substackcdn.com/image/fetch/$s_!bfeb!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13176bb0-2c90-4be9-88cf-fd13d49c1743_512x392.png 848w, https://substackcdn.com/image/fetch/$s_!bfeb!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13176bb0-2c90-4be9-88cf-fd13d49c1743_512x392.png 1272w, https://substackcdn.com/image/fetch/$s_!bfeb!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F13176bb0-2c90-4be9-88cf-fd13d49c1743_512x392.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>I am not sure the way it assesses precision is the right way to do it but in any case, I do see it test proposed search queries against known &#8220;landmark papers&#8221; to see if the search finds them.</p><p>I expect librarians who are good at piloting searches can do a much better evaluation of what it did than me so I won&#8217;t try to do it.</p><p>In the long run, I wonder if experts could &#8220;teach&#8221; it via example in prompts or even do finetuning to pilot test better?</p><h2>Using Deep research mode</h2><p>With extended thinking enabled, results improve because it thinks longer. Turning on Deep Research mode (&#8220;research&#8221; in Claude) likely produces even more thorough testing&#8212;in one case involving deep research, it made 85 tool calls of &#8220;search article.&#8221;  </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!vguq!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc3da166f-616b-47f5-8f1c-8daed7627f25_1787x789.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!vguq!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc3da166f-616b-47f5-8f1c-8daed7627f25_1787x789.png 424w, https://substackcdn.com/image/fetch/$s_!vguq!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc3da166f-616b-47f5-8f1c-8daed7627f25_1787x789.png 848w, 
https://substackcdn.com/image/fetch/$s_!vguq!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc3da166f-616b-47f5-8f1c-8daed7627f25_1787x789.png 1272w, https://substackcdn.com/image/fetch/$s_!vguq!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc3da166f-616b-47f5-8f1c-8daed7627f25_1787x789.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!vguq!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc3da166f-616b-47f5-8f1c-8daed7627f25_1787x789.png" width="1456" height="643" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c3da166f-616b-47f5-8f1c-8daed7627f25_1787x789.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:643,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:186180,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc3da166f-616b-47f5-8f1c-8daed7627f25_1787x789.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!vguq!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc3da166f-616b-47f5-8f1c-8daed7627f25_1787x789.png 424w, 
https://substackcdn.com/image/fetch/$s_!vguq!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc3da166f-616b-47f5-8f1c-8daed7627f25_1787x789.png 848w, https://substackcdn.com/image/fetch/$s_!vguq!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc3da166f-616b-47f5-8f1c-8daed7627f25_1787x789.png 1272w, https://substackcdn.com/image/fetch/$s_!vguq!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc3da166f-616b-47f5-8f1c-8daed7627f25_1787x789.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>That said in some runs it will decide that doing so is &#8220;overkill&#8221; and refuse to do it</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!djes!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F22643930-1be0-4733-b144-ef4c8e461300_1210x339.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!djes!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F22643930-1be0-4733-b144-ef4c8e461300_1210x339.png 424w, https://substackcdn.com/image/fetch/$s_!djes!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F22643930-1be0-4733-b144-ef4c8e461300_1210x339.png 848w, https://substackcdn.com/image/fetch/$s_!djes!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F22643930-1be0-4733-b144-ef4c8e461300_1210x339.png 1272w, https://substackcdn.com/image/fetch/$s_!djes!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F22643930-1be0-4733-b144-ef4c8e461300_1210x339.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!djes!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F22643930-1be0-4733-b144-ef4c8e461300_1210x339.png" width="1210" height="339" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/22643930-1be0-4733-b144-ef4c8e461300_1210x339.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:339,&quot;width&quot;:1210,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:61400,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178750698?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F22643930-1be0-4733-b144-ef4c8e461300_1210x339.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!djes!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F22643930-1be0-4733-b144-ef4c8e461300_1210x339.png 424w, https://substackcdn.com/image/fetch/$s_!djes!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F22643930-1be0-4733-b144-ef4c8e461300_1210x339.png 848w, https://substackcdn.com/image/fetch/$s_!djes!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F22643930-1be0-4733-b144-ef4c8e461300_1210x339.png 1272w, https://substackcdn.com/image/fetch/$s_!djes!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F22643930-1be0-4733-b144-ef4c8e461300_1210x339.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2>The 2010s Parallel: We&#8217;ve Been Here Before</h2><p>If the MCP architecture sounds familiar, that&#8217;s because it resembles something libraries tried two decades ago: <a href="https://federatedsearchblog.com/2009/03/19/beyond-federated-search/">federated search</a> and <a href="http://www.tandfonline.com/doi/abs/10.1080/19322909.2011.573533">eventually abandoned</a>.</p><h3>The Rise and Fall of Federation</h3><p>Before Web Scale Discovery or Discovery layers in libraries, in the mid to late 2000s, if you wanted to search across multiple databases simultaneously, you used <a href="https://openlab.citytech.cuny.edu/thecoolfoxes/files/2014/05/Lost-in-Translation_The-Reality-of-Federated-Searching.pdf">meta-search or federated search</a>. 
A meta-search system would let you select a few database connectors, enter your query, and the system would translate it to appropriate syntax and send it to each database in real time. Responses would return to your federated search tool, which would combine and display results.</p><p>In practice, this led to slow responses, frequent errors when connectors broke, and terrible ranking. The ranking problem was particularly acute: metadata wasn&#8217;t uniform across sources, and reranking results arriving at different times from multiple sources proved nearly impossible. The technology was slow and unreliable and though many libraries employed it, it was never popular and libraries hungered for a &#8220;one-search&#8221; that worked better.</p><h3>Web Scale Discovery Takes Over</h3><p>In the early-to-mid 2010s, a new approach emerged: Web Scale Discovery. Products like ProQuest&#8217;s Summon, EBSCO Discovery Service, Ex Libris Primo (now under the same owner as ProQuest), and OCLC&#8217;s WorldCat Discovery raced to build large centralised indexes of academic content.</p><p>This was libraries&#8217; attempt to match Google Scholar&#8212;providing a single search box over all academic content. Back then, people wondered: would publishers provide content to these discovery vendors?</p><p>Evidence mounted that opting out meant plummeting usage while competitors who opted in gained ground. Eventually, most content owners capitulated. 
</p><p>Still, the debate at the time in the early to mid 2010s was whether to <a href="https://federatedsearchblog.com/2009/03/19/beyond-federated-search/">&#8220;index when you can, federate when you must&#8221;</a> (Ebsco Discovery Service) or just rely on a centralized index alone (Summon service)&#8212;and <a href="http://www.tandfonline.com/doi/abs/10.1080/19322909.2011.573533">centralised indexing as the only method won decisively.</a></p><p>By the mid 2010s even Ebsco Discovery Service stopped offering federated search because most journal publishers (even Elsevier) opted in to being indexed. As such the added value of federating the remaining content (e.g. newspapers, law databases) was too low to be worth the complexity to set up and maintain, and most users didn&#8217;t want to wait anyway.</p><blockquote><p>The story actually had further nuances, especially the rivalry between ProQuest and EBSCO&#8212;both discovery vendors (Summon and EDS) AND content aggregators. This led to issues like reluctance to exchange metadata properly and problems linking to aggregator content when using a competitor&#8217;s discovery system.</p></blockquote><h3>The AI Search Index Problem</h3><p>Today&#8217;s AI search tools face a similar challenge. Startups like Elicit, Consensus, and Undermind.ai rely on the Semantic Scholar Corpus and OpenAlex. Others like SciSpace and Scite have mostly scraped the open web. 
This limits full-text access to Open Access content and whatever publisher partnerships vendors can negotiate.</p><blockquote><p>Generic deep research tools like OpenAI and Gemini Deep Research spin up virtual browsers to browse like humans, but they face the same limitations and cannot access paywalled content <a href="https://substack.com/@aarontay/note/c-139347721">unless there is some mechanism to stop and allow users to sign in.</a> While you can do this with OpenAI&#8217;s agent, I don&#8217;t see content owners being happy with allowing this.</p></blockquote><p>Some progress has been made&#8212;Scite, Consensus and even Semantic Scholar themselves have announced publisher partnerships. But they&#8217;re far from covering even the majority of publishers. Even Elsevier, despite having full-text access to their own content, holds only a minority of all academic full-text.</p><p>The only player sitting on a substantial crawled full-text corpus was <a href="https://www.nature.com/articles/d41586-024-03746-y">Google Scholar&#8212;and until recently, they hadn&#8217;t used it for &#8220;AI&#8221;</a>. The <a href="https://aarontay.substack.com/p/scholar-labs-early-review-google">launch of Scholar Labs</a> was a step forward, but it focuses on finding papers rather than generating synthesised answers.</p><blockquote><p>Other players I am curious about are the winners of the last &#8220;Academic content war&#8221;, Ebsco and Clarivate (now owner of both Summon and Primo). Clarivate&#8217;s CDI (<a href="https://knowledge.exlibrisgroup.com/Primo/Content_Corner/Central_Discovery_Index/Documentation_and_Training/Documentation_and_Training_(English)/CDI_-_The_Central_Discovery_Index/010An_Overview_of_the_Ex_Libris_Central_Discovery_Index_(CDI)">Central Discovery Index estimated at 5 billion records</a>) is probably the only single source of academic content that can rival Google Scholar&#8217;s. 
I am unsure how much of it is full-text (<a href="https://knowledge.exlibrisgroup.com/Primo/Content_Corner/Central_Discovery_Index/Documentation_and_Training/Documentation_and_Training_%28English%29/CDI_-_The_Central_Discovery_Index/130Full_Text_Indexing_in_CDI">CDI stores the first 65k characters of text when available</a>) but you can already see some publishers like <a href="https://knowledge.exlibrisgroup.com/Primo/Product_Documentation/020Primo_VE/Primo_VE_(English)/015_Getting_Started_with_Primo_Research_Assistant#:~:text=between%20LLM%20versions.-,Content%20Scope,Any%20content%20published%20by%20the%20providers%20above%20coming%20via%20aggregator%20collections.,-These%20details%20will">Elsevier opt out from products like Primo/Summon Research Assistant</a>.</p></blockquote><p>This month, I also heard about <a href="https://www.elsevier.com/academic-and-government/ai-for-researchers">Elsevier&#8217;s LeapSpace</a>, reportedly covering 15+ million peer-reviewed full-text articles not just from Elsevier&#8217;s ScienceDirect and Scopus products but also from other publishers. There was a previous product called ScienceDirect AI, but it seems all existing customers of that product will be transferred to LeapSpace, which suggests Elsevier hopes to go beyond just their own content.</p><p>Will anyone succeed in building comprehensive indexes? Will publishers cooperate as they did for Web Scale Discovery?</p><p></p><h2>Implications of MCP Servers for Academic Content</h2><p>I&#8217;ve been testing these MCP servers for a month and am still absorbing the implications - which probably can be a subject of many future posts. But here are my initial thoughts.</p><h3>Will This Model Catch On?</h3><p>MCP servers represent the federated approach: real-time queries to distributed content sources rather than centralised indexing. Last time, federation lost. 
But three things have changed:</p><p><strong>Content owners are newly cautious.</strong> With intense concerns about AI training on copyrighted content, publishers are far less willing to hand over full text or even title abstracts for centralised indexing. MCP servers let them maintain control&#8212;content stays on their infrastructure.</p><p><strong>The technology has matured.</strong> The problems that plagued old-school federation&#8212;slow responses, broken connectors, terrible ranking&#8212;are more tractable today. LLMs are remarkably capable of synthesising results from multiple sources with different metadata schemas. They can handle the &#8220;messy&#8221; reranking problem that defeated 2000s-era federated search.</p><p><strong>User expectations have shifted.</strong> Federated search was unacceptably slow in 2010. But today&#8217;s users have been trained to wait longer by Deep Search/Deep Research tools that openly take minutes. A few extra seconds for MCP server calls is no longer a dealbreaker.</p><p>Still, for efficiency, systems will want to minimise MCP server calls. We might see content owners organising around large aggregate MCP servers&#8212;by publisher? By field?</p><h2>Business Models</h2><p>How will content owners price MCP access? Will it be tied to institutional subscriptions? Or decoupled entirely?</p><p>One model I&#8217;ve heard discussed mimics Spotify: searching incurs a nominal fee (per-search or per-chunk/token), with content owners paid based on usage. Full-text access would be charged separately. This could appeal to those who want to pay only for what they use rather than subscribing to bundles.</p><p>I can already hear librarians grumbling about publishers finding yet another way to monetise the same content. 
But imagine a model where you no longer subscribe to big bundles of journals and only pay for what your users use.</p><p>See more discussion on <a href="https://pubtechradar.substack.com/p/big-ideas-in-publishing-jonathan">business models here.</a></p><h3>Impact on discovery vendors</h3><p>If MCP-based content access catches on, this could be both an opportunity and a threat to early AI discovery vendors like Elicit and Consensus.</p><p>They could use MCP servers to supplement their existing indexes (unclear about the business model), but once it becomes common for major LLM platforms (ChatGPT, Gemini, Claude, DeepSeek, etc., or even open-weight models) to allow direct academic content access via MCP, the reason to use specialised academic tools diminishes. Many users will prefer sticking with tools they already know.</p><p>In terms of effectiveness, if MCP servers are the major way in which content is retrieved, this makes Discovery products and agents more reliant on the sophistication of the retrieval step built in by the MCP server. </p><p>As we have seen, the Wiley AI Gateway server has a couple of quirks and a discovery vendor like Elicit or Undermind or Scite.ai using it would be subject to the limitations of what the Wiley AI Gateway can retrieve as opposed to designing their own retrieval mechanism for content that is indexed centrally.</p><h3>For Librarians</h3><p><a href="https://aarontay.substack.com/p/were-good-at-search-just-not-the">Understanding information retrieval at a technical level becomes even more important as we evaluate these tools</a>. The transparency Wiley has committed to is encouraging&#8212;I hope it sets a standard.</p><p>The most exciting development is the new capability for Boolean search strategy testing. For the last 3 years, we&#8217;ve found that LLMs couldn&#8217;t match human expert searchers at generating systematic review searches. Now the comparison changes. 
The question isn&#8217;t whether Claude can generate a perfect search string from scratch&#8212;it&#8217;s whether Claude can help refine, test, and improve strategies that human experts develop.</p><h2>Conclusion</h2><p>MCP represents a potential paradigm shift in how AI accesses academic content. Rather than the centralised index model that dominated Web Scale Discovery, we may be entering an era of AI-native federated search&#8212;with better technology, greater transparency, and new business models.</p><p>The parallels to the 2000s are instructive but not determinative. The incentives have shifted, the technology has improved, and user patience has grown. Whether MCP-based access becomes the dominant model or supplements centralised indexes remains to be seen.</p><p>I&#8217;ll continue testing and will share more findings in future posts. Have you experimented with MCP servers for academic search? I&#8217;d love to hear your experiences.</p><p><em> </em></p>]]></content:encoded></item><item><title><![CDATA[Scholar Labs Early Review: Google Scholar Finally Enters the AI Era]]></title><description><![CDATA[Generated by Nano-Banana Pro from text of this blog post]]></description><link>https://aarontay.substack.com/p/scholar-labs-early-review-google</link><guid isPermaLink="false">https://aarontay.substack.com/p/scholar-labs-early-review-google</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Thu, 20 Nov 2025 20:40:08 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!sxVR!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc92ca9c8-0acf-4459-b206-63609d4c3d30_1024x559.jpeg" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" 
href="https://substackcdn.com/image/fetch/$s_!sxVR!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc92ca9c8-0acf-4459-b206-63609d4c3d30_1024x559.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!sxVR!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc92ca9c8-0acf-4459-b206-63609d4c3d30_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!sxVR!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc92ca9c8-0acf-4459-b206-63609d4c3d30_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!sxVR!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc92ca9c8-0acf-4459-b206-63609d4c3d30_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!sxVR!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc92ca9c8-0acf-4459-b206-63609d4c3d30_1024x559.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!sxVR!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc92ca9c8-0acf-4459-b206-63609d4c3d30_1024x559.jpeg" width="1024" height="559" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c92ca9c8-0acf-4459-b206-63609d4c3d30_1024x559.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:559,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:167331,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpeg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/179354033?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc92ca9c8-0acf-4459-b206-63609d4c3d30_1024x559.jpeg&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!sxVR!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc92ca9c8-0acf-4459-b206-63609d4c3d30_1024x559.jpeg 424w, https://substackcdn.com/image/fetch/$s_!sxVR!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc92ca9c8-0acf-4459-b206-63609d4c3d30_1024x559.jpeg 848w, https://substackcdn.com/image/fetch/$s_!sxVR!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc92ca9c8-0acf-4459-b206-63609d4c3d30_1024x559.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!sxVR!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc92ca9c8-0acf-4459-b206-63609d4c3d30_1024x559.jpeg 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" 
width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><em>Generated by Nano-Banana Pro from text of this blog post</em></p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me Coffee! (via ko-fi)&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me Coffee! (via ko-fi)</span></a></p><p>As &#8220;AI-powered academic search engines&#8221; began their rise in 2023, the biggest question on everyone&#8217;s mind was: Where is Google Scholar?</p><p>While <a href="https://gemini.google/overview/deep-research/">Gemini Deep Research came and went</a>, it relied primarily on the general web&#8212;similar to its rival, OpenAI Deep Research. 
Crucially, it failed to leverage Google&#8217;s greatest competitive advantages: the Google Scholar index and Google Books.</p><p>In a November 2024 piece for <em>Nature</em> (&#8220;<a href="https://www.nature.com/articles/d41586-024-03746-y">Can Google Scholar survive the AI revolution?</a>&#8221;), Anurag Acharya, a founder of Google Scholar, noted that they already utilized &#8220;AI&#8221; in ranking. He expressed skepticism regarding the accuracy of LLMs when summarizing multiple papers.</p><p>I believe that perspective missed the point. While traditional information retrieval algorithms are technically &#8220;AI,&#8221; the academic community was asking for the specific power of LLM-based methods. We wanted tools that could deliver significantly higher precision and recall.</p><p>I <a href="https://aarontay.substack.com/p/what-academic-deep-research-is-really">wrote this in August 2025</a>:</p><blockquote><p><strong>Thought Experiment:</strong> Imagine Google Scholar with Deep Search: AI2 PaperFinder/Undermind-style iteration and LLM ranking across the full corpus. No long-form prose, no fabricated references&#8212;just outrageously good rankings. Academics don&#8217;t need sub-second latency; they need better ranking of top-k. 
</p></blockquote><p>TL;DR: Google might have done exactly that (with K = 300) via their new product, Scholar Labs.</p><h2>Google Scholar enters the &#8220;AI&#8221; fray</h2><p>On November 18, 2025&#8212;while most of the internet was abuzz about the launch of Gemini 3&#8212;Google Scholar quietly dropped this blog post: <em><a href="https://scholar.googleblog.com/2025/11/scholar-labs-ai-powered-scholar-search.html">Scholar Labs: An AI Powered Scholar Search.</a></em></p><p>(Note: The official name appears to be &#8220;Scholar Labs,&#8221; not &#8220;Google Scholar Labs&#8221;, which is an odd choice in my view.)</p><p>At 4 PM Singapore time, <a href="https://www.linkedin.com/posts/monicawestin_scholar-labs-an-ai-powered-scholar-search-activity-7396810160402505730-WFsK?utm_source=share&amp;utm_medium=member_desktop&amp;rcm=ACoAAADydNkB8cFBZ48tGuFjE4yHqQ6N6mBWEyE">Monica Westin (a former member of the Google Scholar team) posted about the launch on LinkedIn, tagging me</a>. Naturally, I couldn&#8217;t resist testing it. </p><p>There appears to be a waitlist; the criteria for access remain unclear as I immediately had access (you do need to be signed in). If you happen to be on the waitlist, you can try with your education Google account - I hear that works for some when their personal Google account doesn&#8217;t.</p><p>How does Scholar Labs work? Here is the little they have said about it so far:</p><blockquote><p>It analyzes your question to identify its key topics, aspects and relationships. It then searches for all of them on Scholar, and evaluates the results to identify papers that answer the overall research question. For each paper, it explains how the paper answers your question. And includes all the familiar Scholar features that you depend upon.</p></blockquote><p>This unfortunately is so generic as to be almost useless, so read on to know more.</p><blockquote><p>It has been 24 hours since I started testing this, and these are my early impressions. 
Everything I blog here may turn out to be inaccurate, or the features may change swiftly by the time you read this. Still, it is worth documenting these first thoughts.</p></blockquote><h2>Scholar Labs is &#8220;Deep Search&#8221; not &#8220;Deep Research&#8221;</h2><p>The Verdict: Scholar Labs is an interesting first attempt at adding Generative AI into the search engine. However, they are doing it in a notably conservative way.</p><p>In short, Scholar Labs is what I classify as <a href="https://aarontay.substack.com/p/why-i-think-academic-deep-research#:~:text=From%20there%2C%20we%20can%20map%20AI%2Dpowered%20search%20tools%20into%20four%20quadrants%3A">&#8220;Deep Search&#8221; tool, not &#8220;Deep Research&#8221;.</a></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!RtYY!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffe9021-232f-4967-bed6-89b43dd5c7cf_983x577.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!RtYY!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffe9021-232f-4967-bed6-89b43dd5c7cf_983x577.png 424w, https://substackcdn.com/image/fetch/$s_!RtYY!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffe9021-232f-4967-bed6-89b43dd5c7cf_983x577.png 848w, https://substackcdn.com/image/fetch/$s_!RtYY!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffe9021-232f-4967-bed6-89b43dd5c7cf_983x577.png 1272w, 
https://substackcdn.com/image/fetch/$s_!RtYY!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffe9021-232f-4967-bed6-89b43dd5c7cf_983x577.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!RtYY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffe9021-232f-4967-bed6-89b43dd5c7cf_983x577.png" width="983" height="577" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/6ffe9021-232f-4967-bed6-89b43dd5c7cf_983x577.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:577,&quot;width&quot;:983,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:92075,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/179354033?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffe9021-232f-4967-bed6-89b43dd5c7cf_983x577.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!RtYY!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffe9021-232f-4967-bed6-89b43dd5c7cf_983x577.png 424w, https://substackcdn.com/image/fetch/$s_!RtYY!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffe9021-232f-4967-bed6-89b43dd5c7cf_983x577.png 848w, https://substackcdn.com/image/fetch/$s_!RtYY!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffe9021-232f-4967-bed6-89b43dd5c7cf_983x577.png 1272w, 
https://substackcdn.com/image/fetch/$s_!RtYY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6ffe9021-232f-4967-bed6-89b43dd5c7cf_983x577.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>The main differentiator is that a Deep Search tool is designed to find relevant papers and not generate direct answers. It differs from normal search by going &#8220;deeper,&#8221; running beyond the typical 1000ms latency you expect from Google or conventional databases.</p><p>What is that extra time/compute spent on? 
Typically, one or both of the following:</p><ul><li><p>Iterative Strategy: The LLM may &#8220;decide&#8221; how and what to search in an iterative fashion.</p></li><li><p>Relevance Reasoning: The LLM is used directly to assess papers and generate a &#8220;rationale&#8221; on why a paper is relevant to the query</p></li></ul><p>Deep Search tools function like conventional search engines&#8212;they give you a list of results&#8212;but with the added bonus of generated text explaining why the AI thinks the paper is relevant. This usually results in much higher precision than traditional ranking methods.</p><p><a href="https://allenai.org/blog/paper-finder">AI2 Paper Finder</a> (now under <a href="https://asta.allen.ai/discover?redirect_from=paper-finder">ASTA</a>) was the clearest flag-bearer of this class of products; it is now joined by Scholar Labs.</p><p>This differs from simple RAG (Retrieval Augmented Generation) or Deep Research tools (e.g., Gemini Deep Research, Scopus Deep Research), which attempt to generate an answer by synthesizing across multiple papers. That is a much trickier task than the Deep Search paradigm of &#8220;screening&#8221; individual papers, as it requires balancing findings from multiple papers that may contradict one another or operate in different contexts. 
</p><p>Given the <a href="https://www.nature.com/articles/d41586-024-03746-y">Google Scholar team&#8217;s comments in Nature (Nov 2024)</a>, it is perhaps unsurprising they chose the safer &#8220;Deep Search&#8221; paradigm for Scholar Labs which evaluates paper by paper for the relatively clear task of relevancy to the query.</p><p></p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><p> </p><h3><strong>Scholar Labs: The First Run</strong></h3><div id="youtube2-UE-N0rru8HU" class="youtube-wrap" data-attrs="{&quot;videoId&quot;:&quot;UE-N0rru8HU&quot;,&quot;startTime&quot;:null,&quot;endTime&quot;:null}" data-component-name="Youtube2ToDOM"><div class="youtube-inner"><iframe src="https://www.youtube-nocookie.com/embed/UE-N0rru8HU?rel=0&amp;autoplay=0&amp;showinfo=0&amp;enablejsapi=0" frameborder="0" loading="lazy" gesture="media" allow="autoplay; fullscreen" allowautoplay="true" allowfullscreen="true" width="728" height="409"></iframe></div></div><p>While I classify Scholar Labs as &#8220;Deep Search,&#8221; being Google, they bring their own twist to the formula.</p><p>Here&#8217;s a walkthrough if you don&#8217;t want to watch the video:</p><p>First, you enter your query. 
Like most modern AI tools, the input field encourages natural language. Once you enter your input, a sidebar appears showing the process, while the main column populates with papers it deems relevant.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Po2L!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff8f4225a-c324-4860-a4c3-f403e622a5bf_1696x942.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Po2L!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff8f4225a-c324-4860-a4c3-f403e622a5bf_1696x942.png 424w, https://substackcdn.com/image/fetch/$s_!Po2L!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff8f4225a-c324-4860-a4c3-f403e622a5bf_1696x942.png 848w, https://substackcdn.com/image/fetch/$s_!Po2L!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff8f4225a-c324-4860-a4c3-f403e622a5bf_1696x942.png 1272w, https://substackcdn.com/image/fetch/$s_!Po2L!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff8f4225a-c324-4860-a4c3-f403e622a5bf_1696x942.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Po2L!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff8f4225a-c324-4860-a4c3-f403e622a5bf_1696x942.png" width="1456" height="809" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f8f4225a-c324-4860-a4c3-f403e622a5bf_1696x942.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:809,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:85839,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/179354033?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff8f4225a-c324-4860-a4c3-f403e622a5bf_1696x942.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Po2L!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff8f4225a-c324-4860-a4c3-f403e622a5bf_1696x942.png 424w, https://substackcdn.com/image/fetch/$s_!Po2L!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff8f4225a-c324-4860-a4c3-f403e622a5bf_1696x942.png 848w, https://substackcdn.com/image/fetch/$s_!Po2L!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff8f4225a-c324-4860-a4c3-f403e622a5bf_1696x942.png 1272w, https://substackcdn.com/image/fetch/$s_!Po2L!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff8f4225a-c324-4860-a4c3-f403e622a5bf_1696x942.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Step One : <strong>Query Analysis</strong>: It begins by &#8220;analyzing your question&#8221; to decide how to search. 
Behind the scenes, it is likely performing <a href="https://en.wikipedia.org/wiki/Query_understanding">query understanding</a>, possibly using an LLM like Gemini or other Information Retrieval techniques.</p><p> </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Ble8!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F76c5a8a7-80cb-4e9c-9e8f-c8acf697d6b2_1781x505.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Ble8!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F76c5a8a7-80cb-4e9c-9e8f-c8acf697d6b2_1781x505.png 424w, https://substackcdn.com/image/fetch/$s_!Ble8!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F76c5a8a7-80cb-4e9c-9e8f-c8acf697d6b2_1781x505.png 848w, https://substackcdn.com/image/fetch/$s_!Ble8!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F76c5a8a7-80cb-4e9c-9e8f-c8acf697d6b2_1781x505.png 1272w, https://substackcdn.com/image/fetch/$s_!Ble8!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F76c5a8a7-80cb-4e9c-9e8f-c8acf697d6b2_1781x505.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Ble8!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F76c5a8a7-80cb-4e9c-9e8f-c8acf697d6b2_1781x505.png" width="1456" height="413" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/76c5a8a7-80cb-4e9c-9e8f-c8acf697d6b2_1781x505.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:413,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:40874,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/179354033?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F76c5a8a7-80cb-4e9c-9e8f-c8acf697d6b2_1781x505.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Ble8!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F76c5a8a7-80cb-4e9c-9e8f-c8acf697d6b2_1781x505.png 424w, https://substackcdn.com/image/fetch/$s_!Ble8!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F76c5a8a7-80cb-4e9c-9e8f-c8acf697d6b2_1781x505.png 848w, https://substackcdn.com/image/fetch/$s_!Ble8!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F76c5a8a7-80cb-4e9c-9e8f-c8acf697d6b2_1781x505.png 1272w, https://substackcdn.com/image/fetch/$s_!Ble8!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F76c5a8a7-80cb-4e9c-9e8f-c8acf697d6b2_1781x505.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Step Two : <strong>Query Expansion and Execution</strong>: The interface indicates it runs multiple queries (e.g., in one test, it ran 11 different queries). 
The results are likely combined, de-duped, and re-ranked.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!IXll!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4d8fc616-de25-4ada-ac31-7c31400936e6_1138x483.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!IXll!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4d8fc616-de25-4ada-ac31-7c31400936e6_1138x483.png 424w, https://substackcdn.com/image/fetch/$s_!IXll!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4d8fc616-de25-4ada-ac31-7c31400936e6_1138x483.png 848w, https://substackcdn.com/image/fetch/$s_!IXll!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4d8fc616-de25-4ada-ac31-7c31400936e6_1138x483.png 1272w, https://substackcdn.com/image/fetch/$s_!IXll!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4d8fc616-de25-4ada-ac31-7c31400936e6_1138x483.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!IXll!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4d8fc616-de25-4ada-ac31-7c31400936e6_1138x483.png" width="1138" height="483" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4d8fc616-de25-4ada-ac31-7c31400936e6_1138x483.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:483,&quot;width&quot;:1138,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:24562,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/179354033?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4d8fc616-de25-4ada-ac31-7c31400936e6_1138x483.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!IXll!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4d8fc616-de25-4ada-ac31-7c31400936e6_1138x483.png 424w, https://substackcdn.com/image/fetch/$s_!IXll!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4d8fc616-de25-4ada-ac31-7c31400936e6_1138x483.png 848w, https://substackcdn.com/image/fetch/$s_!IXll!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4d8fc616-de25-4ada-ac31-7c31400936e6_1138x483.png 1272w, https://substackcdn.com/image/fetch/$s_!IXll!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4d8fc616-de25-4ada-ac31-7c31400936e6_1138x483.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Step Three :<strong> Evaluation:</strong> Scholar Labs then displays that it has &#8220;evaluated X top results,&#8221; providing a running count of evaluated top results as time goes by.</p><p>Step Four : <strong>Display</strong>: Relevant papers (or at least what Scholar Labs considers relevant) start to appear in the main column as time goes by with standard Scholar features below or to the right of each entry (PDF links, citation counts, Library Links etc). 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!mYq3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb156ccb4-7612-4885-882f-05c8bb222f12_1872x657.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!mYq3!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb156ccb4-7612-4885-882f-05c8bb222f12_1872x657.png 424w, https://substackcdn.com/image/fetch/$s_!mYq3!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb156ccb4-7612-4885-882f-05c8bb222f12_1872x657.png 848w, https://substackcdn.com/image/fetch/$s_!mYq3!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb156ccb4-7612-4885-882f-05c8bb222f12_1872x657.png 1272w, https://substackcdn.com/image/fetch/$s_!mYq3!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb156ccb4-7612-4885-882f-05c8bb222f12_1872x657.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!mYq3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb156ccb4-7612-4885-882f-05c8bb222f12_1872x657.png" width="1456" height="511" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/b156ccb4-7612-4885-882f-05c8bb222f12_1872x657.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:511,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:136446,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/179354033?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb156ccb4-7612-4885-882f-05c8bb222f12_1872x657.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!mYq3!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb156ccb4-7612-4885-882f-05c8bb222f12_1872x657.png 424w, https://substackcdn.com/image/fetch/$s_!mYq3!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb156ccb4-7612-4885-882f-05c8bb222f12_1872x657.png 848w, https://substackcdn.com/image/fetch/$s_!mYq3!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb156ccb4-7612-4885-882f-05c8bb222f12_1872x657.png 1272w, https://substackcdn.com/image/fetch/$s_!mYq3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb156ccb4-7612-4885-882f-05c8bb222f12_1872x657.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>One big difference. Instead of standard snippets about the paper for each relevant entry found, you get <strong><a href="https://scholar.googleblog.com/">generated text explaining the paper&#8217;s relevance</a></strong><a href="https://scholar.googleblog.com/"> and summary</a>. Notably, it does this paper-by-paper and <em>does not</em> attempt to synthesize across multiple papers.</p><p>In a typical Deep Search tool (like AI2 Paper Finder), the process runs through successive papers until it hits a stopping rule. Scholar Labs appears to have a few specific thresholds:</p><p>With Scholar Labs, it seems to me that, in most cases, it will stop once it thinks it has found 10 relevant papers. 
As seen below, it displays that it has &#8220;found 10 relevant results&#8221; (unfortunately, it does not show how many top results it evaluated to get to that point, though clicking the &#8220;more results&#8221; button resumes the count from where it stopped earlier).</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!4BNM!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72878a67-dfc5-4a9c-a52a-ddee08e1a6f7_1055x759.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!4BNM!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72878a67-dfc5-4a9c-a52a-ddee08e1a6f7_1055x759.png 424w, https://substackcdn.com/image/fetch/$s_!4BNM!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72878a67-dfc5-4a9c-a52a-ddee08e1a6f7_1055x759.png 848w, https://substackcdn.com/image/fetch/$s_!4BNM!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72878a67-dfc5-4a9c-a52a-ddee08e1a6f7_1055x759.png 1272w, https://substackcdn.com/image/fetch/$s_!4BNM!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72878a67-dfc5-4a9c-a52a-ddee08e1a6f7_1055x759.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!4BNM!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72878a67-dfc5-4a9c-a52a-ddee08e1a6f7_1055x759.png" width="1055" height="759" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/72878a67-dfc5-4a9c-a52a-ddee08e1a6f7_1055x759.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:759,&quot;width&quot;:1055,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:73211,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/179354033?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72878a67-dfc5-4a9c-a52a-ddee08e1a6f7_1055x759.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!4BNM!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72878a67-dfc5-4a9c-a52a-ddee08e1a6f7_1055x759.png 424w, https://substackcdn.com/image/fetch/$s_!4BNM!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72878a67-dfc5-4a9c-a52a-ddee08e1a6f7_1055x759.png 848w, https://substackcdn.com/image/fetch/$s_!4BNM!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72878a67-dfc5-4a9c-a52a-ddee08e1a6f7_1055x759.png 1272w, https://substackcdn.com/image/fetch/$s_!4BNM!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F72878a67-dfc5-4a9c-a52a-ddee08e1a6f7_1055x759.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>It&#8217;s not 100% clear what happens when you click &#8220;more results&#8221; (hopefully the Google Scholar team can add text to explain), but I think Scholar Labs just goes down the initial list of results to look for more relevant papers. </p><blockquote><p>There&#8217;s also the possibility that, on clicking &#8220;more results&#8221;, the tool issues additional iterative searches (very unlikely?) or there&#8217;s some sort of active learning model that reranks the results (unlikely; I think it&#8217;s cleaner just to use the LLM &#8212; Gemini 3? &#8212; to screen). I noticed that the rate of finding relevant papers slows down over time, which is expected.</p></blockquote><p>In most tests, it seems to stop at milestones of 10, 20, 30 and 40 relevant papers found, but the hard limit seems to be 50 relevant papers found. 
The system seems to cut off immediately (regardless of how many of the top papers it is at) once it has found 50 relevant papers, and you can no longer ask for more results.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!eTJv!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F36e94cff-98f6-49ff-b9e2-d1ccbcbdd336_1163x779.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!eTJv!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F36e94cff-98f6-49ff-b9e2-d1ccbcbdd336_1163x779.png 424w, https://substackcdn.com/image/fetch/$s_!eTJv!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F36e94cff-98f6-49ff-b9e2-d1ccbcbdd336_1163x779.png 848w, https://substackcdn.com/image/fetch/$s_!eTJv!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F36e94cff-98f6-49ff-b9e2-d1ccbcbdd336_1163x779.png 1272w, https://substackcdn.com/image/fetch/$s_!eTJv!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F36e94cff-98f6-49ff-b9e2-d1ccbcbdd336_1163x779.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!eTJv!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F36e94cff-98f6-49ff-b9e2-d1ccbcbdd336_1163x779.png" width="1163" height="779" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/36e94cff-98f6-49ff-b9e2-d1ccbcbdd336_1163x779.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:779,&quot;width&quot;:1163,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:81079,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/179354033?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F36e94cff-98f6-49ff-b9e2-d1ccbcbdd336_1163x779.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!eTJv!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F36e94cff-98f6-49ff-b9e2-d1ccbcbdd336_1163x779.png 424w, https://substackcdn.com/image/fetch/$s_!eTJv!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F36e94cff-98f6-49ff-b9e2-d1ccbcbdd336_1163x779.png 848w, https://substackcdn.com/image/fetch/$s_!eTJv!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F36e94cff-98f6-49ff-b9e2-d1ccbcbdd336_1163x779.png 1272w, https://substackcdn.com/image/fetch/$s_!eTJv!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F36e94cff-98f6-49ff-b9e2-d1ccbcbdd336_1163x779.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>In the above example, the query was designed to have many relevant results, and Scholar Labs quickly hit the 50 relevant paper mark without going through too many papers (video shows it evaluates around the top 96th result).</p><p>But what happens if you try a tougher or more specific query, will it keep going on until it finds 50 relevant ones (which may not exist)? 
Of course not, so far my tests show there is a hard limit at 300 - aka the tool will stop evaluating once it has evaluated the 300th top result and the &#8220;more results&#8221; button vanishes.</p><p>Below is an example of a query for which Scholar Labs terminates the search once it goes past evaluating the top 300 results, even though it claims to have found only 26 relevant results.</p><div id="youtube2-HQJ72CaFzgc" class="youtube-wrap" data-attrs="{&quot;videoId&quot;:&quot;HQJ72CaFzgc&quot;,&quot;startTime&quot;:null,&quot;endTime&quot;:null}" data-component-name="Youtube2ToDOM"><div class="youtube-inner"><iframe src="https://www.youtube-nocookie.com/embed/HQJ72CaFzgc?rel=0&amp;autoplay=0&amp;showinfo=0&amp;enablejsapi=0" frameborder="0" loading="lazy" gesture="media" allow="autoplay; fullscreen" allowautoplay="true" allowfullscreen="true" width="728" height="409"></iframe></div></div><p>The screenshot below shows another example: it stops after finding 30 relevant results (this round number seems to be a coincidence), but if you were looking at the interface before it displayed this text, you can see it cut off once it had evaluated the top 300 results. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!g-dy!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F714bf980-3afd-43e6-ade9-de9e721fb534_1903x889.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!g-dy!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F714bf980-3afd-43e6-ade9-de9e721fb534_1903x889.png 424w, https://substackcdn.com/image/fetch/$s_!g-dy!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F714bf980-3afd-43e6-ade9-de9e721fb534_1903x889.png 848w, https://substackcdn.com/image/fetch/$s_!g-dy!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F714bf980-3afd-43e6-ade9-de9e721fb534_1903x889.png 1272w, https://substackcdn.com/image/fetch/$s_!g-dy!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F714bf980-3afd-43e6-ade9-de9e721fb534_1903x889.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!g-dy!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F714bf980-3afd-43e6-ade9-de9e721fb534_1903x889.png" width="1456" height="680" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/714bf980-3afd-43e6-ade9-de9e721fb534_1903x889.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:680,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:175664,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/179354033?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F714bf980-3afd-43e6-ade9-de9e721fb534_1903x889.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!g-dy!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F714bf980-3afd-43e6-ade9-de9e721fb534_1903x889.png 424w, https://substackcdn.com/image/fetch/$s_!g-dy!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F714bf980-3afd-43e6-ade9-de9e721fb534_1903x889.png 848w, https://substackcdn.com/image/fetch/$s_!g-dy!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F714bf980-3afd-43e6-ade9-de9e721fb534_1903x889.png 1272w, https://substackcdn.com/image/fetch/$s_!g-dy!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F714bf980-3afd-43e6-ade9-de9e721fb534_1903x889.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" 
width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>As you will see later, there are some outliers where the search will hard stop before reaching 300, even if you have not found 50 relevant articles.</p><p></p><h2>Queries accepted by Scholar Labs</h2><p>With &#8220;AI-powered search,&#8221; the natural question is: What can I ask (in natural language)?</p><p>At the most basic level, does its natural language search &#8220;understand&#8221; commands to filter by metadata or fields? 
Even though Scholar Labs has a sample query that suggests you can ask &#8220;Find papers from past X years on topic Y&#8221;, I am finding it somewhat inconsistent when you state year range.</p><p>Moreover, with the rise of agentic search, we are starting to get used to asking tools to do complex tasks like, &#8220;Find paper X and look for papers it should have cited but didn&#8217;t.&#8221; Scholar Labs is clearly not that agentic. In fact, it is quite strict about allowed queries.</p><p>Many of my &#8220;power user&#8221; queries returned a message stating: &#8220;Scholar Labs is currently not designed for queries like this.&#8221;</p><p>Queries that failed:</p><ul><li><p>Sumarise main points of &lt;paper x&gt;</p></li><li><p>What is figure 1 of &lt;paper x&gt;</p></li><li><p>papers by &lt;author x&gt; on &lt;topic y&gt;</p></li><li><p>Papers referenced by &lt;paper x&gt; and papers cited by &lt;paper x&gt; - are inconsistent</p></li></ul><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!nvCY!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffeeebfc7-0021-4cab-9107-bd6bc940cd7a_1100x313.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!nvCY!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffeeebfc7-0021-4cab-9107-bd6bc940cd7a_1100x313.png 424w, https://substackcdn.com/image/fetch/$s_!nvCY!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffeeebfc7-0021-4cab-9107-bd6bc940cd7a_1100x313.png 848w, 
https://substackcdn.com/image/fetch/$s_!nvCY!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffeeebfc7-0021-4cab-9107-bd6bc940cd7a_1100x313.png 1272w, https://substackcdn.com/image/fetch/$s_!nvCY!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffeeebfc7-0021-4cab-9107-bd6bc940cd7a_1100x313.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!nvCY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffeeebfc7-0021-4cab-9107-bd6bc940cd7a_1100x313.png" width="1100" height="313" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/feeebfc7-0021-4cab-9107-bd6bc940cd7a_1100x313.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:313,&quot;width&quot;:1100,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:20101,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/179354033?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffeeebfc7-0021-4cab-9107-bd6bc940cd7a_1100x313.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!nvCY!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffeeebfc7-0021-4cab-9107-bd6bc940cd7a_1100x313.png 424w, 
https://substackcdn.com/image/fetch/$s_!nvCY!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffeeebfc7-0021-4cab-9107-bd6bc940cd7a_1100x313.png 848w, https://substackcdn.com/image/fetch/$s_!nvCY!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffeeebfc7-0021-4cab-9107-bd6bc940cd7a_1100x313.png 1272w, https://substackcdn.com/image/fetch/$s_!nvCY!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffeeebfc7-0021-4cab-9107-bd6bc940cd7a_1100x313.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Some queries work with errors or inconsistently, such as the query below to find &#8220;books&#8221;: it seems to work at first, showing entries with [books], yet other entries found later do not have it. </p><p>Incidentally, this implies this product has access to the Google Books content, like normal Google Scholar.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!L1j_!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b2fd5a3-7745-4357-bb0d-7fc5036a9ecc_1836x915.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!L1j_!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b2fd5a3-7745-4357-bb0d-7fc5036a9ecc_1836x915.png 424w, https://substackcdn.com/image/fetch/$s_!L1j_!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b2fd5a3-7745-4357-bb0d-7fc5036a9ecc_1836x915.png 848w, https://substackcdn.com/image/fetch/$s_!L1j_!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b2fd5a3-7745-4357-bb0d-7fc5036a9ecc_1836x915.png 1272w, https://substackcdn.com/image/fetch/$s_!L1j_!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b2fd5a3-7745-4357-bb0d-7fc5036a9ecc_1836x915.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!L1j_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b2fd5a3-7745-4357-bb0d-7fc5036a9ecc_1836x915.png" 
width="1456" height="726" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/7b2fd5a3-7745-4357-bb0d-7fc5036a9ecc_1836x915.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:726,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:114242,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/179354033?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b2fd5a3-7745-4357-bb0d-7fc5036a9ecc_1836x915.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!L1j_!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b2fd5a3-7745-4357-bb0d-7fc5036a9ecc_1836x915.png 424w, https://substackcdn.com/image/fetch/$s_!L1j_!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b2fd5a3-7745-4357-bb0d-7fc5036a9ecc_1836x915.png 848w, https://substackcdn.com/image/fetch/$s_!L1j_!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b2fd5a3-7745-4357-bb0d-7fc5036a9ecc_1836x915.png 1272w, https://substackcdn.com/image/fetch/$s_!L1j_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7b2fd5a3-7745-4357-bb0d-7fc5036a9ecc_1836x915.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg 
role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>I have been asked if this product includes case law; I think it doesn&#8217;t, as this is about articles. I am also fairly certain it never shows patents, and even [citation] entries don&#8217;t appear, perhaps because there isn&#8217;t enough information to evaluate them on?</p><p>Speculation: This strict filtering might be designed to protect content owner relationships. 
By blocking &#8220;interrogation&#8221; style queries, Google ensures users still need to access the full text, rather than getting all the details from the AI.</p><h2>Implications for researchers</h2><p>If my assessment of how Scholar Labs works is correct, this is a game-changer solely due to the scale of Google Scholar&#8217;s index.</p><p>Scholar&#8217;s index dwarfs OpenAlex, Semantic Scholar (used by many new &#8220;AI academic search&#8221; tools), and others. It includes full text from almost every major publisher (which allow crawls from Google Scholar). If Scholar Labs inherits this exact index (and isn&#8217;t walled off from paywalled full-text), it should dominate in non-STEM disciplines where other databases are weaker.</p><p>Already when testing searches like </p><p><code>find me papers that mention Elicit.com</code></p><p>it outdoes my favourite Undermind.ai tool simply due to the size of the index. </p><p>Its size is so big it often surprises me. </p><p>For example, I tested it with &#8220;impossible queries&#8221;&#8212;topics I thought had no results&#8212;and it surprised me by surfacing a forgotten PowerPoint slide or obscure paper that mentions that query. </p><p>As such it is probably excellent for finding papers when you have forgotten the title, though it is not perfect. </p><h2>Weakness of the tool</h2><p>That said, it&#8217;s not the &#8220;one ring&#8221; to rule all academic AI search tools.</p><p>Firstly, it is just Deep Search, or &#8220;paper finder&#8221;. 
I am not underselling how powerful and useful this is, in fact I did a <a href="https://aarontay.substack.com/p/why-i-think-academic-deep-research">whole blog post to say I am more bullish on Deep Search than Deep Research.</a> </p><p>Most AI-powered search tools are <a href="https://aarontay.substack.com/p/what-academic-deep-research-is-really">pivoting towards Deep Research, which provides long reports and visualizations that synthesize results across multiple papers,</a> and this can be valuable if you use it to quickly get an overview of the land, yet it is something which Scholar Labs does not touch and likely may not for a while.</p><p>Secondly, the current interface is a bit awkward. I&#8217;ve already seen comments from people complaining it is tiresome to keep clicking &#8220;more results&#8221;. Why not let it run longer (until it has evaluated 300 or so results)? I guess as a free product you probably want to save compute; Google is of course rich and powerful, but Google Scholar is far more popular than AI2 paper finder&#8230;</p><h3><strong>Inherent Limitations for High-Recall Systematic Reviews</strong></h3><p>While Scholar Labs offers high precision&#8212;and will frankly impress anyone who hasn&#8217;t used this class of tools before&#8212;it is not sufficient on its own for evidence synthesis or systematic reviews, which demand super-high recall. This is because Scholar Labs inherits the inherent limitations of the underlying Google Scholar infrastructure. </p><p>To explain this, we must look at standard practice. A common guideline for evidence synthesis when using Google Scholar is to scan the first 200&#8211;300 results. Scholar Labs appears to automate this approach (ignoring the stop at 50 relevant rule). However, in traditional systematic reviews, this method is used only as a supplement, never as a replacement for the main search process that involves searching across multiple databases.</p><p>Why? 
Early papers from the 2010s by <a href="https://link.springer.com/article/10.1186/1472-6947-13-7">evidence synthesis experts demonstrated that while Google Scholar&#8217;s index is vast&#8212;often having near 100% coverage of relevant papers found in a review</a>&#8212;findability is a different issue. You can prove this high coverage yourself by taking a completed systematic review and searching Google Scholar by title for the included papers; they are almost always there.</p><p>This begs the question: If the coverage is so high, why not cut out the middleman and use Google Scholar alone? The answer is that while <a href="https://pubmed.ncbi.nlm.nih.gov/26932789/">the papers are indexed (high coverage), finding all of them using only Google Scholar is impractical due to the poor precision caused by its limited search functionality</a>.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!MhYT!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9459ac65-12c0-4cc7-bc7a-7669cf5cf5d2_1176x386.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!MhYT!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9459ac65-12c0-4cc7-bc7a-7669cf5cf5d2_1176x386.png 424w, https://substackcdn.com/image/fetch/$s_!MhYT!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9459ac65-12c0-4cc7-bc7a-7669cf5cf5d2_1176x386.png 848w, https://substackcdn.com/image/fetch/$s_!MhYT!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9459ac65-12c0-4cc7-bc7a-7669cf5cf5d2_1176x386.png 1272w, 
https://substackcdn.com/image/fetch/$s_!MhYT!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9459ac65-12c0-4cc7-bc7a-7669cf5cf5d2_1176x386.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!MhYT!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9459ac65-12c0-4cc7-bc7a-7669cf5cf5d2_1176x386.png" width="1176" height="386" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/9459ac65-12c0-4cc7-bc7a-7669cf5cf5d2_1176x386.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:386,&quot;width&quot;:1176,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:71867,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/179354033?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9459ac65-12c0-4cc7-bc7a-7669cf5cf5d2_1176x386.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!MhYT!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9459ac65-12c0-4cc7-bc7a-7669cf5cf5d2_1176x386.png 424w, https://substackcdn.com/image/fetch/$s_!MhYT!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9459ac65-12c0-4cc7-bc7a-7669cf5cf5d2_1176x386.png 848w, 
https://substackcdn.com/image/fetch/$s_!MhYT!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9459ac65-12c0-4cc7-bc7a-7669cf5cf5d2_1176x386.png 1272w, https://substackcdn.com/image/fetch/$s_!MhYT!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9459ac65-12c0-4cc7-bc7a-7669cf5cf5d2_1176x386.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Compared to structured databases like PubMed, Scopus, or Embase,<a 
href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/1471-2288-13-131"> Google Scholar suffers from significant limitations:</a></p><ol><li><p>No complex search logic: Lack of nested Boolean support and no proximity operators. No official support for truncation for word endings. </p></li><li><p>Short queries: Stricter limits on search strategy length (no more than 256 characters). EDIT - Michael Gusenbauer&#8217;s great work at SearchSmart also <a href="https://www.linkedin.com/posts/mgusenbauer_one-week-after-google-launched-google-activity-7399084534710992898-CgQ4?utm_source=share&amp;utm_medium=member_desktop&amp;rcm=ACoAAADydNkB8cFBZ48tGuFjE4yHqQ6N6mBWEyE">detected a change in Google Scholar support of query length from 256 to 2048 character length! Likely related to Scholar Labs launch</a>.</p></li><li><p>No controlled vocabulary: Limited filters and no MeSH/Emtree equivalents.</p></li><li><p>Limited field searching: In particular, you cannot limit searches to just &#8220;Title/Abstract.&#8221; Because you are searching full-text, you get massive amounts of noise for some query terms.</p></li><li><p>Export limits: A lack of bulk export options and a hard cap of 1,000 results.</p></li></ol><p>These limitations make it difficult to craft a single search strategy that captures all relevant results, even if all relevant papers are indexed. A very broad search strategy might work in theory but in practice you end up having too many false drops (super low precision).</p><blockquote><p><a href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/1471-2288-13-131">One example</a> given was how the Google Scholar strategy, when translated from a traditional search strategy from a Cochrane Review, had to be simplified from a 1,391-character search strategy that included a large number of drug-specific names combined using OR. This simplified Google Scholar strategy probably led to missing relevant papers. 
</p></blockquote><p>Worse, even if a search captured them, the lack of abstract-only matching and other features to create precise searches means you would be drowning in noise. </p><p>Finally, even if you were willing to spend more time screening them, the 1,000-result hard cap acts as a final barrier.</p><p>This is not just theoretical but has been studied multiple times.</p><p>One study illustrated this perfectly: <a href="https://pubmed.ncbi.nlm.nih.gov/26932789/">Google Scholar had 97.2% coverage (verified via known-item search), but recall dropped to 72.6% when using a real search query (Original Query AND Title AND Author), and plummeted to 46.4% if restricted to the top 1,000 results.</a></p><blockquote><p><a href="https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/1471-2288-13-131">Another study</a> did better and had a higher recall of 92.9% instead of 72.6% (when using a real search query but ignoring the 1,000-result limit) but noted even if you could screen all the returns, you would have a precision of 0.13% which is &gt;20x worse than normal databases! This means you would need to screen 20x more papers to get 1 relevant paper! </p><p>Note that this horrible precision is assuming you screen everything; in reality, precision when screening up to 1,000 is around 1% which isn&#8217;t so bad, but you get a big hit in recall.</p></blockquote><blockquote><p>While most 2010s studies in the medical sciences concluded Google Scholar is too blunt a tool to use alone, some recent studies in the 2020s (focusing on <a href="https://journals.sagepub.com/doi/abs/10.1177/09610006241256393">Social Science</a>, <a href="https://torkar.github.io/pdfs/08984351.pdf">Software Engineering</a>, and even one in <a href="https://link.springer.com/article/10.1007/s12070-023-03532-8">Otolaryngology</a>) suggest otherwise. 
However, this success is often due to the specific, unique terminology used in those reviews, which prevents the result explosion common in broader searches.  </p></blockquote><p>Ultimately, even with near 100% coverage with the almighty Google Scholar index, failure occurs because:</p><ol><li><p>The paper was in the database, but the search strategy failed to retrieve it.</p></li><li><p>The paper was retrieved by the search strategy but fell beyond the 1,000-result hard cap.</p></li></ol><p>How does Scholar Labs change this? Unfortunately, Scholar Labs&#8217; method of running a search and evaluating the top 300 results remains vulnerable to both issues. Even if the system is expert-level at screening, it can only evaluate what it &#8220;sees&#8221; in that top tier. A major improvement would be if Scholar Labs allowed users to evaluate the top 500 or even 1,000 results.</p><blockquote><p>If AI is used for screening, in theory you could compensate for the much poorer precision Google Scholar has by &#8220;letting the AI do it&#8221;, but you need to go way past 300 or even 1,000.</p></blockquote><p>Scholar Labs does run multiple queries, which might mitigate the risk of relying on a single, length-limited search string. However, we need testing to see if these generated queries are diverse and effective enough. </p><p>If these multiple queries are simply generated by a prompted LLM, there is reason for pessimism; <a href="https://www.sciencedirect.com/science/article/pii/S0895435625000794">most studies attempting to use LLMs to generate Boolean search strategies for systematic reviews have shown unpromising results</a> (though these focus mostly on PubMed searches).</p><p>Anecdotally, I have already seen Scholar Labs fail to find papers I know exist. Aside from the classic <a href="https://link.springer.com/article/10.1186/1472-6947-13-7">Gehanno et al. (2013)</a> and <a href="https://link.springer.com/article/10.1007/s12070-023-03532-8">Bramer et al. 
(2013)</a> papers regarding coverage, I tried to find a <a href="https://link.springer.com/article/10.1007/s12070-023-03532-8">more recent paper I knew existed - claiming that reviewing the top 500 Google Scholar results could yield 99% recall</a> but I could not remember the title offhand. Scholar Labs failed to find it initially. I eventually surfaced it by manually altering the query to be more specific and restricting the date range to the last 5 years. This highlights that the tool remains highly sensitive to the specific query entered.</p><p>Finally, there is the concern of &#8220;outsourcing relevance.&#8221; While <a href="https://app.undermind.ai/report/b65b2b0710729959bcc0a6006463c898298622b01b60d5dc7e3a592205e110c5">recent studies on using LLMs for screening are promising, results are heterogeneous and dependent on the model, prompting technique and the domain</a>. Even with high correlation with human judgement, I worry about subtle biases&#8212;specifically, that the AI might consistently drop certain types of relevant papers. </p><blockquote><p>In evidence synthesis, we generally tolerate false positives (noise) but fear false negatives (missing data). My initial skimming suggests Scholar Labs produces few false positives, which, paradoxically for a systematic reviewer, raises anxiety about potential false negatives.</p></blockquote><p>As such, I expect evidence synthesis practitioners to be lukewarm about this tool. At best, it automates the supplementary &#8220;Google Scholar check&#8221; they already perform&#8212;perhaps offering slightly better recall via multiple queries&#8212;but it is unlikely to be groundbreaking. 
They will still need traditional databases to ensure the necessary recall.</p><h2>Implications for discovery vendors</h2><p>In a sense, Google Scholar deciding to play in the AI sandbox is bad news for discovery vendors. Google Scholar is the 500-pound gorilla in academic search and anything they do will draw attention and be used by researchers.</p><p>That said, currently, they still don&#8217;t occupy the Deep Research space so tools like Undermind, Consensus still have a place.</p><h2>Implications for content owners</h2><p>It&#8217;s interesting that content owners are content with letting Google Scholar use their content (for now) including full text in an &#8220;AI search&#8221;. Granted, this is only for AI Deep Search and with query filtering of certain types of queries, users will still have to download the relevant found paper to read, mitigating content owners&#8217; greatest fear that users using gen AI can benefit from full text without downloading the content.</p><p>Still, with the winds blowing towards distributing content using MCP servers e.g. <a href="https://www.wiley.com/en-us/solutions-partnerships/ai-solutions/">Wiley AI Gateway,</a> perhaps Scholar Labs might be an anomaly because only they have the clout and visibility to be given access to full text?</p><h2>Conclusion</h2><p>This is a quick 24-hour review of a new tool that is likely to cause waves by simply being part of Google Scholar. No doubt much of what I have written is either foolish or totally wrong but that is the price of trying to be early.</p><p>I will end by stating some items on my wish list</p><ul><li><p>Option to extend evaluation to the top 500/1,000 results (premium??) 
</p></li><li><p>Option to set to stop after every 10/20/30/50 relevant results (premium??)</p></li><li><p>Allowing saving of Scholar Labs search sessions, and even one that can be shared</p></li><li><p>More transparency</p><ul><li><p>show the keyword search used in multiple queries </p></li><li><p>show not just found x results but also how many top results have been evaluated (maybe even providing some visualization to show relevant found vs evaluated) when the search stops. </p></li></ul></li><li><p>Could Scholar Labs do citation chasing of found relevant articles by evaluating cites of relevant articles found?</p></li><li><p>Will search alerts be based on this new paradigm of evaluation?</p></li></ul><p></p><p></p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! 
Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div>]]></content:encoded></item><item><title><![CDATA[A 2025 Deep Dive of Consensus: Promises and Pitfalls in AI-Powered Academic Search ]]></title><description><![CDATA[The recent addition of Consensus Deep Search mode is a great boost to its retrieval capabilities.&#160;On top of that, it has one of the most appealing interfaces out there, with color-coded references, and the Consensus Meter, for all its methodological faults, is likely to appeal to undergraduates and less advanced users. Add advanced pre-filters and LibKey integration to institutional full-text, and it is easy to guess this will be a hit for many users doing narrative literature reviews.]]></description><link>https://aarontay.substack.com/p/a-2025-deep-dive-of-consensus-promises</link><guid isPermaLink="false">https://aarontay.substack.com/p/a-2025-deep-dive-of-consensus-promises</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Sat, 15 Nov 2025 21:47:51 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!Czne!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F80c652a7-c4f5-445a-aa9f-1c3c1bbafb04_729x800.jpeg" length="0" type="image/jpeg"/><content:encoded><![CDATA[<p>Academic librarians are increasingly being asked about AI-powered search tools that promise to revolutionize literature discovery. 
</p><p><a href="http://consensus.app">Consensus</a> is one of the more prominent and earliest players in this space (alongside <a href="http://elicit.com">Elicit</a>, <a href="https://www.perplexity.ai/">Perplexity</a>), positioning itself as a tool that can not only find relevant papers but assess the &#8220;consensus&#8221; of research on a topic. Singapore Management University Libraries recently acquired institutional access to both Consensus and Undermind.ai, giving me the opportunity to evaluate these tools in depth. </p><p>This review examines Consensus&#8217;s capabilities, critically assesses some unique features offered, and as a bonus compares it with Undermind.ai.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me Coffee! (via ko-fi)&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me Coffee! (via ko-fi)</span></a></p><h2>Core Functionality: How Consensus Works</h2><p>At a basic level, Consensus operates like many AI-powered academic search tools. You type a natural-language question, the system searches its index, and returns an AI-generated answer with citations. 
The interface is clean, and the documentation (<a href="https://consensus.app/home/blog/best-practices/">search best-practice guide</a> and <a href="https://help.consensus.app/en/articles/9922891-consensus-guide-how-to-write-a-literature-review-or-dissertation">tutorial</a>) is clear and approachable.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!yXgt!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Facc2be0c-afb5-4ecf-af69-c45966087cec_1167x462.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!yXgt!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Facc2be0c-afb5-4ecf-af69-c45966087cec_1167x462.png 424w, https://substackcdn.com/image/fetch/$s_!yXgt!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Facc2be0c-afb5-4ecf-af69-c45966087cec_1167x462.png 848w, https://substackcdn.com/image/fetch/$s_!yXgt!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Facc2be0c-afb5-4ecf-af69-c45966087cec_1167x462.png 1272w, https://substackcdn.com/image/fetch/$s_!yXgt!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Facc2be0c-afb5-4ecf-af69-c45966087cec_1167x462.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!yXgt!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Facc2be0c-afb5-4ecf-af69-c45966087cec_1167x462.png" width="1167" height="462" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/acc2be0c-afb5-4ecf-af69-c45966087cec_1167x462.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:462,&quot;width&quot;:1167,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:23715,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178770843?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Facc2be0c-afb5-4ecf-af69-c45966087cec_1167x462.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!yXgt!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Facc2be0c-afb5-4ecf-af69-c45966087cec_1167x462.png 424w, https://substackcdn.com/image/fetch/$s_!yXgt!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Facc2be0c-afb5-4ecf-af69-c45966087cec_1167x462.png 848w, https://substackcdn.com/image/fetch/$s_!yXgt!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Facc2be0c-afb5-4ecf-af69-c45966087cec_1167x462.png 1272w, https://substackcdn.com/image/fetch/$s_!yXgt!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Facc2be0c-afb5-4ecf-af69-c45966087cec_1167x462.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>You can of course just type in your question or topic in natural language, but when using such tools, I like to look at what the interface suggests as possible inputs, which gives you a hint of what it is capable of. </p><p>Personally, I think listing &#8220;Try a Deep Search&#8221; and &#8220;Try the Consensus Meter&#8221; is somewhat confusing here since it doesn&#8217;t actually suggest what to input but instead turns on different modes.</p><p>&#8220;Draft an outline&#8221; and &#8220;Create a table&#8221; do give you sample inputs you can try but I suspect most people just ignore them and type naturally what they want - which works.</p><p>So far, so familiar. 
Where things get interesting is in the data sources, ranking architecture, and&#8212;most controversially&#8212;the &#8220;Consensus Meter.&#8221;</p><p> </p><h3>Data Sources and Coverage</h3><p>Consensus draws <a href="https://consensus.app/home/blog/how-consensus-works/#:~:text=What%20Does%20Consensus%20Search%20Over%3F">primarily from open sources, particularly OpenAlex and Semantic Scholar, giving it access to approximately 200 million papers including preprints.</a> </p><p>In practice this means:</p><ul><li><p>Consensus usually has <strong>abstracts</strong> for most indexed papers</p></li><li><p>It has <strong>full text</strong> only for open access articles (plus a small slice from publisher partnerships)</p></li></ul><p> How does this compare with traditional databases?</p><ul><li><p>Web of Science: ~100 million records</p></li><li><p>Scopus: ~90 million records</p></li></ul><p>Consensus appears &#8220;bigger&#8221; mainly because it includes preprints and more open access material. But the key constraint is <strong>full-text access</strong>. For most paywalled content, it is working from titles and abstracts only.</p><p>For librarians, this matters:</p><ul><li><p>In fields with strong OA penetration (e.g. 
computer science, high-energy physics, genomics), Consensus may have very good full-text coverage.</p></li><li><p>In fields where paywalls dominate (humanities, many social sciences), Consensus is often doing abstract-only analysis on a large proportion of the literature.</p></li></ul><p>None of this is unique to Consensus, as many of its competitors like Elicit.com, Undermind.ai are in the same boat.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><h3>Search Architecture and Quality Signals</h3><p>Consensus uses what is now a fairly industry standard retrieval stack:</p><ul><li><p><strong><a href="https://consensus.app/home/blog/how-consensus-works/#:~:text=How%20Does%20a%20Consensus%20Search%20Work%3F">Hybrid search</a></strong><a href="https://consensus.app/home/blog/how-consensus-works/#:~:text=How%20Does%20a%20Consensus%20Search%20Work%3F"> combining keyword and semantic (embedding-based) search</a></p></li><li><p><strong><a 
href="https://consensus.app/home/blog/how-consensus-works/#:~:text=After%20the%20initial%20relevance%20filter%2C%20we%20take%20the%20top%201%2C500%20papers%20and%20re%2Drank%20them%2C%20not%20just%20by%20how%20well%20they%20match%20your%20query%2C%20but%20also%20by%20how%20strong%20the%20research%20is.">Multi-stage ranking</a></strong>, including:</p><ul><li><p>Initial hybrid retrieval (top ~1,500 results)</p></li><li><p>Reranking by query relevancy match and &#8220;<a href="https://consensus.app/home/blog/how-consensus-works/#:~:text=After%20the%20initial%20relevance%20filter%2C%20we%20take%20the%20top%201%2C500%20papers%20and%20re%2Drank%20them%2C%20not%20just%20by%20how%20well%20they%20match%20your%20query%2C%20but%20also%20by%20how%20strong%20the%20research%20is.">research strength&#8221; (citation counts, recency, journal reputation)</a></p></li><li><p>A final pass that selects the top 20 (for pro mode).</p></li></ul></li></ul><p>The interesting bit is the explicit attempt to rank not only by textual relevance, but also by <strong>proxies for research quality</strong> (citations, study design, journal-level signals). This is common in traditional academic search (think Google Scholar), but still relatively rare among newer AI search tools that often optimise purely for semantic similarity.</p><p>However, these quality signals in my view come with serious caveats.</p><blockquote><p>As of this writing, Consensus has announced <a href="https://openai.com/index/consensus/">&#8220;Scholar Agent&#8221; in collaboration with OpenAI</a>, deployed in &#8220;Pro&#8221; and &#8220;Deep&#8221; modes (we will discuss this later). 
This means Consensus <a href="https://developers.openai.com/blog/responses-api/">now uses GPT-5 through the response API, with specialized planning, search, and reading agents working together (see post for flow diagram)</a>.</p></blockquote><h2>Quality Signals and Study Classification</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!NElm!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0caf4193-16e8-4ab9-880d-c4b39374f791_1227x608.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!NElm!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0caf4193-16e8-4ab9-880d-c4b39374f791_1227x608.png 424w, https://substackcdn.com/image/fetch/$s_!NElm!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0caf4193-16e8-4ab9-880d-c4b39374f791_1227x608.png 848w, https://substackcdn.com/image/fetch/$s_!NElm!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0caf4193-16e8-4ab9-880d-c4b39374f791_1227x608.png 1272w, https://substackcdn.com/image/fetch/$s_!NElm!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0caf4193-16e8-4ab9-880d-c4b39374f791_1227x608.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!NElm!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0caf4193-16e8-4ab9-880d-c4b39374f791_1227x608.png" width="1227" height="608" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/0caf4193-16e8-4ab9-880d-c4b39374f791_1227x608.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:608,&quot;width&quot;:1227,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:80897,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178770843?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0caf4193-16e8-4ab9-880d-c4b39374f791_1227x608.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!NElm!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0caf4193-16e8-4ab9-880d-c4b39374f791_1227x608.png 424w, https://substackcdn.com/image/fetch/$s_!NElm!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0caf4193-16e8-4ab9-880d-c4b39374f791_1227x608.png 848w, https://substackcdn.com/image/fetch/$s_!NElm!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0caf4193-16e8-4ab9-880d-c4b39374f791_1227x608.png 1272w, https://substackcdn.com/image/fetch/$s_!NElm!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0caf4193-16e8-4ab9-880d-c4b39374f791_1227x608.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>As mentioned, Consensus rankings take into account research quality signals like citation counts, method used (RCT, systematic review, meta-analysis) and the journal reputation (&#8220;rigorous journals&#8221;) and the retrieved references will often be tagged with these signals.</p><p>Of the research quality signals, the one using journal reputation is of course the most dubious, though one could even argue that judging quality by method might not be a good idea, as knowing a study is an RCT might not tell you whether the RCT is properly conducted or not&#8230; (with the added complication that the method is extracted and assigned by the LLM).</p><h3>Journal Quality Metrics</h3><p>In Consensus, papers are tagged based on journal reputation using  <a href="https://www.sciscore.com/rti/overview.php">SciScore</a>, with &#8220;rigorous 
journals&#8221; being in the top 50th percentile and &#8220;very rigorous journals&#8221; in the top 10th percentile. This percentile ranking claims to &#8220;<strong><a href="https://www.scicrunch.com/consensus-partnership">help users better understand the quality of their search results</a></strong>&#8221;</p><p><strong>What is SciScore?</strong> <a href="https://www.sciscore.com/rti/overview.php">SciScore</a> is a tool that evaluates papers on research rigor criteria like whether appropriate authentication of key biological resources is reported, use of randomization and blinding, sample size calculations, and data/code availability. It produces both article-level and journal-level scores.</p><p><strong>Some Issues</strong></p><ul><li><p><strong>Container &#8800; content. </strong>Even the most &#8220;rigorous&#8221; journals publish weak or even retracted studies. Using journal score as a shortcut for article quality is methodologically shaky (see DORA).</p></li><li><p><strong>Perverse incentives. </strong>High-impact journals preferentially publish novel, surprising findings, which are more likely to fail replication. Prestige and reliability are not the same thing.</p></li><li><p><strong>Field specificity.</strong> SciScore is optimised for biomedical research. How well do these criteria translate to economics, sociology, or computer science? </p></li><li><p><strong>Citation bias.</strong> Citation counts are highly field- and document-type dependent. Reviews and methods papers accumulate citations very differently from niche empirical work. Does Consensus normalize for this?</p></li></ul><h3>LLM-Based Study Design and &#8220;Study Snapshots&#8221;</h3><p>Consensus also uses LLMs to classify study designs (meta-analysis, RCT, systematic review, cohort study, etc.) 
and to extract:</p><ul><li><p>Population</p></li><li><p>Methods</p></li><li><p>Sample size</p></li><li><p>Outcomes</p></li><li><p>Results</p></li></ul><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!OyT-!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2832a8-0ee9-4785-86fe-32c20cd2c459_1599x818.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!OyT-!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2832a8-0ee9-4785-86fe-32c20cd2c459_1599x818.png 424w, https://substackcdn.com/image/fetch/$s_!OyT-!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2832a8-0ee9-4785-86fe-32c20cd2c459_1599x818.png 848w, https://substackcdn.com/image/fetch/$s_!OyT-!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2832a8-0ee9-4785-86fe-32c20cd2c459_1599x818.png 1272w, https://substackcdn.com/image/fetch/$s_!OyT-!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2832a8-0ee9-4785-86fe-32c20cd2c459_1599x818.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!OyT-!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2832a8-0ee9-4785-86fe-32c20cd2c459_1599x818.png" width="1456" height="745" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/bf2832a8-0ee9-4785-86fe-32c20cd2c459_1599x818.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:745,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:168877,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178770843?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2832a8-0ee9-4785-86fe-32c20cd2c459_1599x818.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!OyT-!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2832a8-0ee9-4785-86fe-32c20cd2c459_1599x818.png 424w, https://substackcdn.com/image/fetch/$s_!OyT-!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2832a8-0ee9-4785-86fe-32c20cd2c459_1599x818.png 848w, https://substackcdn.com/image/fetch/$s_!OyT-!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2832a8-0ee9-4785-86fe-32c20cd2c459_1599x818.png 1272w, https://substackcdn.com/image/fetch/$s_!OyT-!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbf2832a8-0ee9-4785-86fe-32c20cd2c459_1599x818.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>These power the &#8220;Study Snapshots&#8221; for individual papers. It&#8217;s a genuinely useful feature, especially for quick triage. 
But the classifications are AI-generated and can be wrong.</p><h2>The Consensus Meter: Reading the Room or Miscounting Votes?</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!RVEn!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd0c1fea-2f57-470c-b4eb-21834f67f3cb_813x717.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!RVEn!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd0c1fea-2f57-470c-b4eb-21834f67f3cb_813x717.png 424w, https://substackcdn.com/image/fetch/$s_!RVEn!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd0c1fea-2f57-470c-b4eb-21834f67f3cb_813x717.png 848w, https://substackcdn.com/image/fetch/$s_!RVEn!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd0c1fea-2f57-470c-b4eb-21834f67f3cb_813x717.png 1272w, https://substackcdn.com/image/fetch/$s_!RVEn!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd0c1fea-2f57-470c-b4eb-21834f67f3cb_813x717.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!RVEn!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd0c1fea-2f57-470c-b4eb-21834f67f3cb_813x717.png" width="813" height="717" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/dd0c1fea-2f57-470c-b4eb-21834f67f3cb_813x717.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:717,&quot;width&quot;:813,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;NA&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="NA" title="NA" srcset="https://substackcdn.com/image/fetch/$s_!RVEn!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd0c1fea-2f57-470c-b4eb-21834f67f3cb_813x717.png 424w, https://substackcdn.com/image/fetch/$s_!RVEn!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd0c1fea-2f57-470c-b4eb-21834f67f3cb_813x717.png 848w, https://substackcdn.com/image/fetch/$s_!RVEn!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd0c1fea-2f57-470c-b4eb-21834f67f3cb_813x717.png 1272w, https://substackcdn.com/image/fetch/$s_!RVEn!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdd0c1fea-2f57-470c-b4eb-21834f67f3cb_813x717.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The flagship feature is the <strong>Consensus Meter</strong>, which tries to summarise what the literature &#8220;says&#8221; about a given question by categorising papers into &#8220;yes&#8221;, &#8220;no&#8221;, &#8220;mixed&#8221;, or &#8220;possibly&#8221; and then visualising the distribution.</p><p>For example, for the query:</p><blockquote><p>&#8220;Do certain personality traits influence career success?&#8221;</p></blockquote><p>Consensus might show something like:</p><ul><li><p>94% (16 papers): <strong>Yes</strong></p></li><li><p>6% (1 paper): <strong>Mixed</strong></p></li></ul><p>You also get context like average publication year, journal quartile, and citation counts per category.</p><p>This is intuitive and eye-catching. 
<a href="https://www.linkedin.com/posts/mikeacaulfield_reading-the-room-on-azar-gat-claims-activity-7323540251396689922-AX3_/">This informal process where you can get a sense of the literature is akin to what Mike Caulfield calls &#8220;reading the room.&#8221;</a> </p><p>This is fine for quick heuristic checks - but under the hood, it is essentially a form of <strong>vote counting</strong>&#8212;an approach evidence synthesis methodologists have spent decades warning against. </p><p> </p><h3>When the Meter Actually Helps</h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Czne!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F80c652a7-c4f5-445a-aa9f-1c3c1bbafb04_729x800.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Czne!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F80c652a7-c4f5-445a-aa9f-1c3c1bbafb04_729x800.jpeg 424w, https://substackcdn.com/image/fetch/$s_!Czne!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F80c652a7-c4f5-445a-aa9f-1c3c1bbafb04_729x800.jpeg 848w, https://substackcdn.com/image/fetch/$s_!Czne!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F80c652a7-c4f5-445a-aa9f-1c3c1bbafb04_729x800.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!Czne!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F80c652a7-c4f5-445a-aa9f-1c3c1bbafb04_729x800.jpeg 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!Czne!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F80c652a7-c4f5-445a-aa9f-1c3c1bbafb04_729x800.jpeg" width="729" height="800" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/80c652a7-c4f5-445a-aa9f-1c3c1bbafb04_729x800.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:800,&quot;width&quot;:729,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;NA&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="NA" title="NA" srcset="https://substackcdn.com/image/fetch/$s_!Czne!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F80c652a7-c4f5-445a-aa9f-1c3c1bbafb04_729x800.jpeg 424w, https://substackcdn.com/image/fetch/$s_!Czne!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F80c652a7-c4f5-445a-aa9f-1c3c1bbafb04_729x800.jpeg 848w, https://substackcdn.com/image/fetch/$s_!Czne!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F80c652a7-c4f5-445a-aa9f-1c3c1bbafb04_729x800.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!Czne!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F80c652a7-c4f5-445a-aa9f-1c3c1bbafb04_729x800.jpeg 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft 
pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Take another example:</p><blockquote><p>&#8220;Does chess training causally improve academic performance in children?&#8221;</p></blockquote><p>Consensus might show something along the lines of:</p><ul><li><p>41%: &#8220;Yes&#8221;</p></li><li><p>12%: &#8220;Possibly&#8221;</p></li><li><p>24%: &#8220;Mixed&#8221;</p></li><li><p>24%: &#8220;No&#8221;</p></li></ul><p>So far, that looks ambiguous: some yes, some no, some mixed.</p><p>However, if you look closer, you may notice that none of the &#8220;yes&#8221; studies are tier-one evidence (RCTs, systematic reviews, meta-analyses), whereas the more negative conclusions cluster among higher-tier designs. 
That&#8217;s a genuinely useful pattern to surface.</p><p>Similarly, in other examples, you might notice the &#8220;no&#8221; studies tend to be more recent, which implies the earlier studies may have been refuted. </p><p>Still, as discussed already, signals like journal tiers, average citation counts and methods are weak quality signals that may have issues. For example, high tier journals do not always imply higher quality articles and it is common for older papers that show positive results to have higher citations vs more recent papers that refute the older papers.</p><h3>Why Vote Counting Is Methodologically Weak</h3><p>In fact, the Consensus Meter embodies a problematic approach to evidence synthesis that the systematic review community largely abandoned decades ago for more formalized methods of evidence synthesis. This is essentially vote-counting&#8212;tallying studies by their conclusions&#8212;which has well-documented limitations:</p><p><strong>1. Equal Weighting Problem</strong>: A small study (n=50) counts the same as a large study (n=5,000). The chess example partially addresses this by flagging tier-one studies, but the meter itself doesn&#8217;t weight by study quality or sample size.</p><p><strong>2. Ignores Effect Sizes</strong>: Two studies might both say &#8220;yes,&#8221; but one finds a small effect (Cohen&#8217;s d=0.1) while another finds a large effect (d=0.8). Vote-counting treats these identically.</p><p><strong>3. Publication Bias Blindness</strong>: Published literature systematically overrepresents positive findings. Consensus&#8217;s search of a 200M+ index, including preprints, helps reduce this, but it still does not have the comprehensiveness of a properly done systematic review. A meter showing 80% of papers say &#8220;yes&#8221; might reflect publication bias rather than true consensus. </p><p><strong>4. 
Heterogeneity of studies</strong>: Papers may address subtly different questions, use different operationalizations, or study different populations. Collapsing these into yes/no/mixed categories loses crucial nuance. Consensus may not be able to assess this distinction as well. </p><p><strong>5. Interpretation Ambiguity</strong>: What do &#8220;possibly&#8221; and &#8220;mixed&#8221; mean? These are extracted judgments, not reported conclusions.</p><p><strong>6. Lack of quality assessment</strong>: Proper evidence synthesis involves critical appraisal of the included studies to ensure that &#8220;consensus&#8221; is based on rigorous studies only. The fact that Consensus does an inclusive search of a 200M+ index helps reduce publication bias, but you run into the problem that it is more likely to include poor quality studies. Consensus does rank studies based on &#8220;quality signals&#8221;, but as discussed earlier the way Consensus does this is shaky.  </p><p>To their credit, Consensus does expose some quality signals (e.g. 
number of &#8220;tier one&#8221; studies, average journal rank), but these are still blunt instruments.</p><p> The right way to think about the Consensus Meter is:</p><ul><li><p><strong>Not</strong> a mini meta-analysis (not that Consensus recommends it to be used this way)</p></li><li><p><strong>More</strong> like the start of a scoping study or &#8220;conversation starter&#8221; about the literature</p></li></ul><p>As such, it can actually be a nice teaching tool for undergraduates&#8212;provided we explicitly discuss its limitations.</p><h2>Search Modes and Filters</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!8L61!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00506c5a-c0de-4a65-8067-e5002931fcdf_831x469.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!8L61!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00506c5a-c0de-4a65-8067-e5002931fcdf_831x469.png 424w, https://substackcdn.com/image/fetch/$s_!8L61!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00506c5a-c0de-4a65-8067-e5002931fcdf_831x469.png 848w, https://substackcdn.com/image/fetch/$s_!8L61!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00506c5a-c0de-4a65-8067-e5002931fcdf_831x469.png 1272w, https://substackcdn.com/image/fetch/$s_!8L61!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00506c5a-c0de-4a65-8067-e5002931fcdf_831x469.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!8L61!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00506c5a-c0de-4a65-8067-e5002931fcdf_831x469.png" width="831" height="469" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/00506c5a-c0de-4a65-8067-e5002931fcdf_831x469.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:469,&quot;width&quot;:831,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;NA&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="NA" title="NA" srcset="https://substackcdn.com/image/fetch/$s_!8L61!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00506c5a-c0de-4a65-8067-e5002931fcdf_831x469.png 424w, https://substackcdn.com/image/fetch/$s_!8L61!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00506c5a-c0de-4a65-8067-e5002931fcdf_831x469.png 848w, https://substackcdn.com/image/fetch/$s_!8L61!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00506c5a-c0de-4a65-8067-e5002931fcdf_831x469.png 1272w, https://substackcdn.com/image/fetch/$s_!8L61!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F00506c5a-c0de-4a65-8067-e5002931fcdf_831x469.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset 
pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h3>Quick, Pro, and Deep Modes</h3><p>Consensus offers three effort levels that determine how long it searches and how many of the papers it finds are ultimately used in the summary.</p><ul><li><p><strong>Quick</strong>: Summarizes max 10 papers</p></li><li><p><strong>Pro</strong>: Summarizes max 20 papers</p></li><li><p><strong>Deep</strong>: Summarizes max 50 papers (becomes Deep Search with additional features)</p></li></ul><p>I mostly use Deep (enterprise tier gives me 50 runs a month), as I&#8217;m willing to trade time for more coverage. Undergraduates or casual users may gravitate to Quick or Pro. 
All examples in this post are based on Deep.</p><h3>Filtering: Surprisingly Rich and Transparent</h3><p>Consensus&#8217;s pre-filtering options are one of its standout strengths, especially compared to many AI search competitors:</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!OQTZ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e849fc1-0176-4d41-bc5f-c5b716c2372f_1920x1068.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!OQTZ!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e849fc1-0176-4d41-bc5f-c5b716c2372f_1920x1068.png 424w, https://substackcdn.com/image/fetch/$s_!OQTZ!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e849fc1-0176-4d41-bc5f-c5b716c2372f_1920x1068.png 848w, https://substackcdn.com/image/fetch/$s_!OQTZ!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e849fc1-0176-4d41-bc5f-c5b716c2372f_1920x1068.png 1272w, https://substackcdn.com/image/fetch/$s_!OQTZ!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e849fc1-0176-4d41-bc5f-c5b716c2372f_1920x1068.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!OQTZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e849fc1-0176-4d41-bc5f-c5b716c2372f_1920x1068.png" width="1456" height="810" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/5e849fc1-0176-4d41-bc5f-c5b716c2372f_1920x1068.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:810,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;NA&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="NA" title="NA" srcset="https://substackcdn.com/image/fetch/$s_!OQTZ!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e849fc1-0176-4d41-bc5f-c5b716c2372f_1920x1068.png 424w, https://substackcdn.com/image/fetch/$s_!OQTZ!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e849fc1-0176-4d41-bc5f-c5b716c2372f_1920x1068.png 848w, https://substackcdn.com/image/fetch/$s_!OQTZ!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e849fc1-0176-4d41-bc5f-c5b716c2372f_1920x1068.png 1272w, https://substackcdn.com/image/fetch/$s_!OQTZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e849fc1-0176-4d41-bc5f-c5b716c2372f_1920x1068.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Standard filters include:</p><ul><li><p>Publication year</p></li><li><p>Scimago Journal Rank</p></li><li><p>Citation count</p></li><li><p>Exclude preprints</p></li></ul><p>More unusual:</p><ul><li><p><strong>Study Design</strong>: Filter by meta-analysis, RCT, systematic review, case study, etc.</p></li><li><p><strong>Sample Size</strong>: Minimum thresholds</p></li><li><p><strong>Field of Study</strong>: 23 disciplines</p></li><li><p><strong>Countries</strong>: 236 countries</p></li><li><p><strong>Medical Mode</strong>: Restricts to ~8M papers from ~50,000 clinical guidelines and top 1,000 medical journals</p></li></ul><p>This can be genuinely useful, but it also reinforces that Consensus is shaped around a STEM/biomedical worldview. The filters and quality markers align more naturally with clinical and experimental work than with qualitative research, theory-heavy fields, or the humanities. 
</p><h3>Medical mode + uploading of papers</h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!bua1!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9325807d-dff7-4135-99c9-5b8a6fccb94c_859x620.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!bua1!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9325807d-dff7-4135-99c9-5b8a6fccb94c_859x620.png 424w, https://substackcdn.com/image/fetch/$s_!bua1!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9325807d-dff7-4135-99c9-5b8a6fccb94c_859x620.png 848w, https://substackcdn.com/image/fetch/$s_!bua1!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9325807d-dff7-4135-99c9-5b8a6fccb94c_859x620.png 1272w, https://substackcdn.com/image/fetch/$s_!bua1!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9325807d-dff7-4135-99c9-5b8a6fccb94c_859x620.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!bua1!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9325807d-dff7-4135-99c9-5b8a6fccb94c_859x620.png" width="859" height="620" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/9325807d-dff7-4135-99c9-5b8a6fccb94c_859x620.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:620,&quot;width&quot;:859,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:36642,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178770843?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9325807d-dff7-4135-99c9-5b8a6fccb94c_859x620.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!bua1!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9325807d-dff7-4135-99c9-5b8a6fccb94c_859x620.png 424w, https://substackcdn.com/image/fetch/$s_!bua1!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9325807d-dff7-4135-99c9-5b8a6fccb94c_859x620.png 848w, https://substackcdn.com/image/fetch/$s_!bua1!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9325807d-dff7-4135-99c9-5b8a6fccb94c_859x620.png 1272w, https://substackcdn.com/image/fetch/$s_!bua1!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9325807d-dff7-4135-99c9-5b8a6fccb94c_859x620.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Consensus has always had a slant towards medical/life sciences but they have doubled down further with the <a href="https://consensus.app/home/blog/introducing-medical-mode-focused-search-for-clinical-evidence/">recent &#8220;medicine mode&#8221;</a>.</p><p>This is a special limiter that <a href="https://consensus.app/home/blog/introducing-medical-mode-focused-search-for-clinical-evidence/">limits the search to 8 million papers and guidelines from &#8220;top 1000 medical journals and 50,000 clinical guidelines&#8221;.</a></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!0E_X!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3651ac91-9709-4e34-97cf-25532d365ee3_908x576.png" 
data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!0E_X!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3651ac91-9709-4e34-97cf-25532d365ee3_908x576.png 424w, https://substackcdn.com/image/fetch/$s_!0E_X!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3651ac91-9709-4e34-97cf-25532d365ee3_908x576.png 848w, https://substackcdn.com/image/fetch/$s_!0E_X!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3651ac91-9709-4e34-97cf-25532d365ee3_908x576.png 1272w, https://substackcdn.com/image/fetch/$s_!0E_X!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3651ac91-9709-4e34-97cf-25532d365ee3_908x576.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!0E_X!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3651ac91-9709-4e34-97cf-25532d365ee3_908x576.png" width="908" height="576" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/3651ac91-9709-4e34-97cf-25532d365ee3_908x576.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:576,&quot;width&quot;:908,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:71176,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178770843?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3651ac91-9709-4e34-97cf-25532d365ee3_908x576.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!0E_X!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3651ac91-9709-4e34-97cf-25532d365ee3_908x576.png 424w, https://substackcdn.com/image/fetch/$s_!0E_X!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3651ac91-9709-4e34-97cf-25532d365ee3_908x576.png 848w, https://substackcdn.com/image/fetch/$s_!0E_X!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3651ac91-9709-4e34-97cf-25532d365ee3_908x576.png 1272w, https://substackcdn.com/image/fetch/$s_!0E_X!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3651ac91-9709-4e34-97cf-25532d365ee3_908x576.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This whitelist by journals no doubt removes results from lesser-known or even predatory journals, but I suspect medical librarians reading this would have preferred it to correspond somehow to MEDLINE or the larger PubMed set (which is tricky, because I understand this isn&#8217;t strictly by journal, though one could imagine using OpenAlex records with PMIDs only) rather than trying to rate journals using their own criteria.</p><p>The other feature, which is quite well hidden, is that you can upload papers to your search. 
I increasingly see this feature in tools like scite assistant, Elicit and SciSpace, but speaking as a librarian, I know publishers and content owners will be very unhappy with such usage of their content.</p><p></p><h2>LibKey Integration: A Small but Important Win</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!KCiD!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe1d46d87-2fff-4717-ae6a-229ee25c3698_915x433.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!KCiD!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe1d46d87-2fff-4717-ae6a-229ee25c3698_915x433.png 424w, https://substackcdn.com/image/fetch/$s_!KCiD!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe1d46d87-2fff-4717-ae6a-229ee25c3698_915x433.png 848w, https://substackcdn.com/image/fetch/$s_!KCiD!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe1d46d87-2fff-4717-ae6a-229ee25c3698_915x433.png 1272w, https://substackcdn.com/image/fetch/$s_!KCiD!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe1d46d87-2fff-4717-ae6a-229ee25c3698_915x433.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!KCiD!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe1d46d87-2fff-4717-ae6a-229ee25c3698_915x433.png" width="915" height="433" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/e1d46d87-2fff-4717-ae6a-229ee25c3698_915x433.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:433,&quot;width&quot;:915,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!KCiD!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe1d46d87-2fff-4717-ae6a-229ee25c3698_915x433.png 424w, https://substackcdn.com/image/fetch/$s_!KCiD!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe1d46d87-2fff-4717-ae6a-229ee25c3698_915x433.png 848w, https://substackcdn.com/image/fetch/$s_!KCiD!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe1d46d87-2fff-4717-ae6a-229ee25c3698_915x433.png 1272w, https://substackcdn.com/image/fetch/$s_!KCiD!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe1d46d87-2fff-4717-ae6a-229ee25c3698_915x433.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>From a library point of view, one of the most practical features is <strong>LibKey integration</strong>.</p><p>Under Settings &#8594; Preferences, users can select their institution (e.g., &#8220;Singapore Management University&#8221;). Consensus then:</p><ul><li><p>Checks whether the paper is available via your holdings</p></li><li><p>Shows a small institutional icon next to records with accessible full text</p></li><li><p>Lets users click through via LibKey to the subscribed version</p></li></ul><p>Interestingly, among academic AI search tools, this kind of integration is still rarer than it should be. 
Consensus deserves credit here for supporting this.</p><p>Note that this doesn&#8217;t solve the full-text limitation for the AI itself&#8212;Deep Search cannot read paywalled content via LibKey&#8212;but it does significantly improve the user&#8217;s access experience.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!OHFd!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F940e6c37-db91-4dc2-84d6-fd749521b1ab_801x310.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!OHFd!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F940e6c37-db91-4dc2-84d6-fd749521b1ab_801x310.png 424w, https://substackcdn.com/image/fetch/$s_!OHFd!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F940e6c37-db91-4dc2-84d6-fd749521b1ab_801x310.png 848w, https://substackcdn.com/image/fetch/$s_!OHFd!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F940e6c37-db91-4dc2-84d6-fd749521b1ab_801x310.png 1272w, https://substackcdn.com/image/fetch/$s_!OHFd!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F940e6c37-db91-4dc2-84d6-fd749521b1ab_801x310.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!OHFd!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F940e6c37-db91-4dc2-84d6-fd749521b1ab_801x310.png" width="801" height="310" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/940e6c37-db91-4dc2-84d6-fd749521b1ab_801x310.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:310,&quot;width&quot;:801,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!OHFd!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F940e6c37-db91-4dc2-84d6-fd749521b1ab_801x310.png 424w, https://substackcdn.com/image/fetch/$s_!OHFd!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F940e6c37-db91-4dc2-84d6-fd749521b1ab_801x310.png 848w, https://substackcdn.com/image/fetch/$s_!OHFd!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F940e6c37-db91-4dc2-84d6-fd749521b1ab_801x310.png 1272w, https://substackcdn.com/image/fetch/$s_!OHFd!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F940e6c37-db91-4dc2-84d6-fd749521b1ab_801x310.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>While Deep Search mode can use full text (shown by the special document icon), this is strictly only for free papers and not related to your access via LibKey.</p><p>The only tool I know that actually uses institutional holdings directly in its own pipeline (without manual downloading/uploading) is <a href="https://support.elicit.com/en/articles/6123329">Elicit.com, via a browser extension.</a> </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!QNeu!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a6fa321-36d5-4d05-8e07-d2c334c4043d_1253x639.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" 
srcset="https://substackcdn.com/image/fetch/$s_!QNeu!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a6fa321-36d5-4d05-8e07-d2c334c4043d_1253x639.png 424w, https://substackcdn.com/image/fetch/$s_!QNeu!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a6fa321-36d5-4d05-8e07-d2c334c4043d_1253x639.png 848w, https://substackcdn.com/image/fetch/$s_!QNeu!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a6fa321-36d5-4d05-8e07-d2c334c4043d_1253x639.png 1272w, https://substackcdn.com/image/fetch/$s_!QNeu!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a6fa321-36d5-4d05-8e07-d2c334c4043d_1253x639.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!QNeu!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a6fa321-36d5-4d05-8e07-d2c334c4043d_1253x639.png" width="1253" height="639" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/1a6fa321-36d5-4d05-8e07-d2c334c4043d_1253x639.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:639,&quot;width&quot;:1253,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:70126,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178770843?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a6fa321-36d5-4d05-8e07-d2c334c4043d_1253x639.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" 
class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!QNeu!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a6fa321-36d5-4d05-8e07-d2c334c4043d_1253x639.png 424w, https://substackcdn.com/image/fetch/$s_!QNeu!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a6fa321-36d5-4d05-8e07-d2c334c4043d_1253x639.png 848w, https://substackcdn.com/image/fetch/$s_!QNeu!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a6fa321-36d5-4d05-8e07-d2c334c4043d_1253x639.png 1272w, https://substackcdn.com/image/fetch/$s_!QNeu!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1a6fa321-36d5-4d05-8e07-d2c334c4043d_1253x639.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" 
stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><h2>Deep Search: Consensus&#8217;s Answer to Deep Research</h2><p><a href="https://library.smu.edu.sg/topics-insights/deep-research-literature-tools-what-are-they-and-how-are-they-different">&#8220;Deep Research&#8221; is becoming a distinct product category</a>: agentic AI workflows that spend 10+ minutes iterating through queries, following citations, and synthesising long-form reports. We see general-purpose versions (OpenAI Deep Research, Gemini Deep Research) and academic-specific ones (<a href="http://undermind.ai">Undermind.ai</a>, <a href="https://blog.scopus.com/accelerate-your-workflow-with-deep-research-a-new-scopus-ai-feature/">Scopus Deep Research</a>, <a href="https://asta.allen.ai/">AI2&#8217;s ASTA</a> and <a href="https://musingsaboutlibrarianship.blogspot.com/p/list-of-academic-search-engines-that.html#:~:text=List%20of%20academic,paragraphs).%20See%20more">more</a>).</p><div class="digest-post-embed" data-attrs="{&quot;nodeId&quot;:&quot;7ce41912-1f28-4cf8-b740-7691d2ad159b&quot;,&quot;caption&quot;:&quot;&quot;,&quot;cta&quot;:&quot;Read full story&quot;,&quot;showBylines&quot;:true,&quot;size&quot;:&quot;lg&quot;,&quot;isEditorNode&quot;:true,&quot;title&quot;:&quot;Why I Think Academic Deep Research &#8212; or at Least Deep Search &#8212; Will &#8220;Win&#8221; &quot;,&quot;publishedBylines&quot;:[{&quot;id&quot;:10210801,&quot;name&quot;:&quot;Aaron Tay&quot;,&quot;bio&quot;:&quot;I'm librarian + blogger from Singapore Management University. Social media, bibliometrics, analytics, library tech. 
Here to learn from experts, not an expert.&quot;,&quot;photo_url&quot;:&quot;https://substackcdn.com/image/fetch/f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fbucketeer-e05bbc84-baa3-437e-9518-adb32be77984.s3.amazonaws.com%2Fpublic%2Fimages%2Ff39219af-fee4-4db6-a3e1-47bb76350df6_314x280.jpeg&quot;,&quot;is_guest&quot;:false,&quot;bestseller_tier&quot;:null}],&quot;post_date&quot;:&quot;2025-08-08T10:28:15.521Z&quot;,&quot;cover_image&quot;:&quot;https://substackcdn.com/image/youtube/w_728,c_limit/-xjnS8O6YZY&quot;,&quot;cover_image_alt&quot;:null,&quot;canonical_url&quot;:&quot;https://aarontay.substack.com/p/why-i-think-academic-deep-research&quot;,&quot;section_name&quot;:null,&quot;video_upload_id&quot;:null,&quot;id&quot;:169736667,&quot;type&quot;:&quot;newsletter&quot;,&quot;reaction_count&quot;:11,&quot;comment_count&quot;:3,&quot;publication_id&quot;:267832,&quot;publication_name&quot;:&quot;Aaron Tay's Musings about Librarianship&quot;,&quot;publication_logo_url&quot;:&quot;https://substackcdn.com/image/fetch/$s_!SIBS!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdabe20d0-c305-4694-b04d-13176319efee_440x440.png&quot;,&quot;belowTheFold&quot;:true,&quot;youtube_url&quot;:null,&quot;show_links&quot;:null,&quot;feed_url&quot;:null}"></div><p></p><p>Consensus Deep Search, introduced fairly recently, is its entry in this space. It is broadly comparable to Undermind.ai and, to a lesser extent, Elicit&#8217;s &#8220;Research Report&#8221; / systematic review flows. Both Undermind and Consensus typically finish in under 10 minutes; in my experience, Consensus is slightly faster.</p><blockquote><p>Why do the &#8220;deep&#8221; features of specialised tools like Undermind, Consensus, Elicit.com tend to work faster than generic Deep Research from OpenAI, Gemini etc and yet search as deeply if not more so?  
Part of the reason is that the latter tend to search by &#8220;computer use&#8221; - it loads up a web browser and browses the web like a human. This is of course much slower than direct access via APIs or local lookups done by Undermind, Consensus, Elicit. On the other hand, access to just indexed academic content has blind spots of course.</p></blockquote><p></p><p>Key behavioural differences:</p><ul><li><p><strong>Consensus Deep Search</strong>: runs immediately, no clarifying questions</p></li><li><p><strong>Undermind</strong>: asks several clarifying questions before searching</p></li></ul><p>Some users find Undermind&#8217;s questions annoying; others (myself included) think they meaningfully improve search quality when you&#8217;re new to an area.</p><p>That said, some librarians dislike the fact that Undermind&#8217;s search process is 100% non-transparent. Consensus Deep Search, while not 100% transparent, at least shows more of its search process compared to Undermind.ai, which is a complete black box.</p><p>Search Process Transparency</p><p>Unlike Undermind.ai, which provides virtually no insight into its search process, Consensus Deep Search generates a PRISMA-like flow diagram:</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!19cA!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F976b2e10-0035-4421-9948-d433d2034848_1698x793.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!19cA!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F976b2e10-0035-4421-9948-d433d2034848_1698x793.png 424w, 
https://substackcdn.com/image/fetch/$s_!19cA!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F976b2e10-0035-4421-9948-d433d2034848_1698x793.png 848w, https://substackcdn.com/image/fetch/$s_!19cA!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F976b2e10-0035-4421-9948-d433d2034848_1698x793.png 1272w, https://substackcdn.com/image/fetch/$s_!19cA!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F976b2e10-0035-4421-9948-d433d2034848_1698x793.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!19cA!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F976b2e10-0035-4421-9948-d433d2034848_1698x793.png" width="1456" height="680" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/976b2e10-0035-4421-9948-d433d2034848_1698x793.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:680,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;NA&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="NA" title="NA" srcset="https://substackcdn.com/image/fetch/$s_!19cA!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F976b2e10-0035-4421-9948-d433d2034848_1698x793.png 424w, 
https://substackcdn.com/image/fetch/$s_!19cA!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F976b2e10-0035-4421-9948-d433d2034848_1698x793.png 848w, https://substackcdn.com/image/fetch/$s_!19cA!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F976b2e10-0035-4421-9948-d433d2034848_1698x793.png 1272w, https://substackcdn.com/image/fetch/$s_!19cA!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F976b2e10-0035-4421-9948-d433d2034848_1698x793.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><em>Deep Search flow diagram showing search process</em></p><p>In this example, Deep Search:</p><ol><li><p>Ran 20 queries &#8594; 1,004 hits</p></li><li><p>Performed citation searching &#8594; 43 additional papers</p></li><li><p>Total hits: 1,047</p></li><li><p>Removed papers without abstracts and duplicates (-333) &#8594; 714 papers</p></li><li><p>Removed papers with &#8220;low semantic relevance&#8221; (-141) &#8594; 573 papers</p></li><li><p>Selected top 50 papers (after reranking)</p></li></ol><p>The sidebar provides even more detail. You can click on each section to see the actual queries executed:</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!pfOj!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F468fe3fd-1009-4704-914a-cc67f6281c7e_506x641.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!pfOj!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F468fe3fd-1009-4704-914a-cc67f6281c7e_506x641.png 424w, https://substackcdn.com/image/fetch/$s_!pfOj!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F468fe3fd-1009-4704-914a-cc67f6281c7e_506x641.png 848w, https://substackcdn.com/image/fetch/$s_!pfOj!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F468fe3fd-1009-4704-914a-cc67f6281c7e_506x641.png 1272w, 
https://substackcdn.com/image/fetch/$s_!pfOj!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F468fe3fd-1009-4704-914a-cc67f6281c7e_506x641.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!pfOj!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F468fe3fd-1009-4704-914a-cc67f6281c7e_506x641.png" width="506" height="641" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/468fe3fd-1009-4704-914a-cc67f6281c7e_506x641.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:641,&quot;width&quot;:506,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;NA&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="NA" title="NA" srcset="https://substackcdn.com/image/fetch/$s_!pfOj!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F468fe3fd-1009-4704-914a-cc67f6281c7e_506x641.png 424w, https://substackcdn.com/image/fetch/$s_!pfOj!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F468fe3fd-1009-4704-914a-cc67f6281c7e_506x641.png 848w, https://substackcdn.com/image/fetch/$s_!pfOj!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F468fe3fd-1009-4704-914a-cc67f6281c7e_506x641.png 1272w, 
https://substackcdn.com/image/fetch/$s_!pfOj!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F468fe3fd-1009-4704-914a-cc67f6281c7e_506x641.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>You can even see the criteria used for citation searching. 
This level of transparency is valuable for users who need to understand and potentially document their search strategy.</p><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!CEXc!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd7c88129-0548-48eb-892d-3cf69c2f451f_494x163.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!CEXc!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd7c88129-0548-48eb-892d-3cf69c2f451f_494x163.png 424w, https://substackcdn.com/image/fetch/$s_!CEXc!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd7c88129-0548-48eb-892d-3cf69c2f451f_494x163.png 848w, https://substackcdn.com/image/fetch/$s_!CEXc!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd7c88129-0548-48eb-892d-3cf69c2f451f_494x163.png 1272w, https://substackcdn.com/image/fetch/$s_!CEXc!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd7c88129-0548-48eb-892d-3cf69c2f451f_494x163.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!CEXc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd7c88129-0548-48eb-892d-3cf69c2f451f_494x163.png" width="494" height="163" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/d7c88129-0548-48eb-892d-3cf69c2f451f_494x163.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:163,&quot;width&quot;:494,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;NA&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="NA" title="NA" srcset="https://substackcdn.com/image/fetch/$s_!CEXc!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd7c88129-0548-48eb-892d-3cf69c2f451f_494x163.png 424w, https://substackcdn.com/image/fetch/$s_!CEXc!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd7c88129-0548-48eb-892d-3cf69c2f451f_494x163.png 848w, https://substackcdn.com/image/fetch/$s_!CEXc!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd7c88129-0548-48eb-892d-3cf69c2f451f_494x163.png 1272w, https://substackcdn.com/image/fetch/$s_!CEXc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd7c88129-0548-48eb-892d-3cf69c2f451f_494x163.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><h2></h2><h3>Reproducibility and Explainability Concerns</h3><p>However, if you put on the evidence-synthesis researcher&#8217;s hat, even this level of transparency, which is high for these types of tools, is of course not enough.</p><p><strong>1. 
Can searches be reproduced?</strong> The queries are displayed, but can another researcher run the exact same queries above and produce the same 1,047 hits and the same top 50, assuming no index change?</p><p><a href="https://thinkingmachines.ai/blog/defeating-nondeterminism-in-llm-inference/">LLM-based systems are often non-deterministic, even at temperature 0</a>. In my informal tests, repeated Deep Search runs on the same question minutes apart gave slightly different rankings, though the top 10&#8211;20 papers tended to overlap strongly. </p><blockquote><p>There is an interesting hypothesis (which <a href="https://www.undermind.ai/whitepaper.pdf">Undermind&#8217;s early white paper alludes to) that </a><strong><a href="https://www.undermind.ai/whitepaper.pdf">iterative deep search might converge</a></strong><a href="https://www.undermind.ai/whitepaper.pdf"> on a stable set of relevant papers once enough items have been evaluated. Their modelling suggests that after ~150&#8211;300 evaluated papers, you&#8217;ve probably seen 80&#8211;98% of the relevant ones</a>. If true (a big &#8220;if&#8221;), this implies we might not get reproducible search <em>steps</em>, but we might still converge on a nearly complete relevant set&#8212;similar in spirit to stopping rules in systematic reviews. This is fertile ground for empirical research. </p></blockquote><p><strong>2. Can the strategy be exported in a usable form?</strong> For systematic reviews, search strategies must be documented and shared. Can the Deep Search process be exported in a format suitable for methods sections?</p><p><strong>3. What about the &#8220;black box&#8221; reranking?</strong> We see 573 eligible papers narrowed to 50, but the reranking algorithm that makes these selections is not transparent. 
What if paper #51 was actually critical to your research question?</p><p>These are not deal-breakers, but they highlight that while Consensus is more transparent than Undermind, it still does not meet the standards of reproducibility required for formal systematic reviews. Like Undermind and the other tools in this class, it is best thought of as a sophisticated scoping or exploratory tool rather than a replacement for systematic review methodology.</p><h3>Consensus Deep Search Output and Visualizations</h3><p>Like many modern Deep Research tools, Consensus Deep Search provides a long-form report with many interesting visualizations. See the <a href="https://consensus.app/search/do-certain-personality-traits-influence-career-suc/BfDwg7NbR9yiazyefv4cuw/">sample report here</a>.</p><p><strong>Unique features</strong>:</p><ol><li><p><strong>Color-Coded Citations</strong>: In-text citations are colored as follows:</p><ul><li><p>Green: &#8220;yes&#8221;</p></li><li><p>Yellow: &#8220;possibly&#8221;</p></li><li><p>Orange: &#8220;mixed&#8221;</p></li><li><p>Red: &#8220;no&#8221;<br>&#8230;based on Consensus Meter labels, with icons indicating whether title/abstract only or full text was used. 
</p></li></ul></li></ol><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!4Ie2!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68d4cd00-45ca-454a-966a-3e9f4b4e65ab_888x659.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!4Ie2!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68d4cd00-45ca-454a-966a-3e9f4b4e65ab_888x659.png 424w, https://substackcdn.com/image/fetch/$s_!4Ie2!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68d4cd00-45ca-454a-966a-3e9f4b4e65ab_888x659.png 848w, https://substackcdn.com/image/fetch/$s_!4Ie2!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68d4cd00-45ca-454a-966a-3e9f4b4e65ab_888x659.png 1272w, https://substackcdn.com/image/fetch/$s_!4Ie2!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68d4cd00-45ca-454a-966a-3e9f4b4e65ab_888x659.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!4Ie2!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68d4cd00-45ca-454a-966a-3e9f4b4e65ab_888x659.png" width="888" height="659" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/68d4cd00-45ca-454a-966a-3e9f4b4e65ab_888x659.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:659,&quot;width&quot;:888,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;NA&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="NA" title="NA" srcset="https://substackcdn.com/image/fetch/$s_!4Ie2!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68d4cd00-45ca-454a-966a-3e9f4b4e65ab_888x659.png 424w, https://substackcdn.com/image/fetch/$s_!4Ie2!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68d4cd00-45ca-454a-966a-3e9f4b4e65ab_888x659.png 848w, https://substackcdn.com/image/fetch/$s_!4Ie2!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68d4cd00-45ca-454a-966a-3e9f4b4e65ab_888x659.png 1272w, https://substackcdn.com/image/fetch/$s_!4Ie2!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F68d4cd00-45ca-454a-966a-3e9f4b4e65ab_888x659.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p></p><ol start="2"><li><p><strong>Claims and Evidence Table</strong>: Structured extraction of key claims and the papers supporting or disputing them.</p></li></ol><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!8j_n!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffb3105cf-d121-40ab-b469-22a89cdc2a0d_647x848.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!8j_n!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffb3105cf-d121-40ab-b469-22a89cdc2a0d_647x848.png 424w, 
https://substackcdn.com/image/fetch/$s_!8j_n!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffb3105cf-d121-40ab-b469-22a89cdc2a0d_647x848.png 848w, https://substackcdn.com/image/fetch/$s_!8j_n!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffb3105cf-d121-40ab-b469-22a89cdc2a0d_647x848.png 1272w, https://substackcdn.com/image/fetch/$s_!8j_n!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffb3105cf-d121-40ab-b469-22a89cdc2a0d_647x848.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!8j_n!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffb3105cf-d121-40ab-b469-22a89cdc2a0d_647x848.png" width="647" height="848" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/fb3105cf-d121-40ab-b469-22a89cdc2a0d_647x848.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:848,&quot;width&quot;:647,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;NA&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="NA" title="NA" srcset="https://substackcdn.com/image/fetch/$s_!8j_n!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffb3105cf-d121-40ab-b469-22a89cdc2a0d_647x848.png 424w, 
https://substackcdn.com/image/fetch/$s_!8j_n!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffb3105cf-d121-40ab-b469-22a89cdc2a0d_647x848.png 848w, https://substackcdn.com/image/fetch/$s_!8j_n!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffb3105cf-d121-40ab-b469-22a89cdc2a0d_647x848.png 1272w, https://substackcdn.com/image/fetch/$s_!8j_n!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffb3105cf-d121-40ab-b469-22a89cdc2a0d_647x848.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Other more common but still useful visualizations include </p><ol start="3"><li><p><strong>Results Timeline</strong>: Shows distribution of relevant papers over time&#8212;useful for identifying emerging trends or seminal early work.</p></li></ol><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Mm7B!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63c0c33a-3799-41a0-92cc-30b87397e967_887x435.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Mm7B!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63c0c33a-3799-41a0-92cc-30b87397e967_887x435.png 424w, https://substackcdn.com/image/fetch/$s_!Mm7B!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63c0c33a-3799-41a0-92cc-30b87397e967_887x435.png 848w, https://substackcdn.com/image/fetch/$s_!Mm7B!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63c0c33a-3799-41a0-92cc-30b87397e967_887x435.png 1272w, https://substackcdn.com/image/fetch/$s_!Mm7B!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63c0c33a-3799-41a0-92cc-30b87397e967_887x435.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Mm7B!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63c0c33a-3799-41a0-92cc-30b87397e967_887x435.png" width="887" height="435" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/63c0c33a-3799-41a0-92cc-30b87397e967_887x435.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:435,&quot;width&quot;:887,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;NA&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="NA" title="NA" srcset="https://substackcdn.com/image/fetch/$s_!Mm7B!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63c0c33a-3799-41a0-92cc-30b87397e967_887x435.png 424w, https://substackcdn.com/image/fetch/$s_!Mm7B!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63c0c33a-3799-41a0-92cc-30b87397e967_887x435.png 848w, https://substackcdn.com/image/fetch/$s_!Mm7B!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63c0c33a-3799-41a0-92cc-30b87397e967_887x435.png 1272w, https://substackcdn.com/image/fetch/$s_!Mm7B!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F63c0c33a-3799-41a0-92cc-30b87397e967_887x435.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><ol start="4"><li><p><strong>Top Contributors, Research Gaps and Open Questions</strong></p></li></ol><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!7crB!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea223c74-dc6c-47c8-8f35-3e009eb85212_794x572.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!7crB!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea223c74-dc6c-47c8-8f35-3e009eb85212_794x572.png 424w, https://substackcdn.com/image/fetch/$s_!7crB!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea223c74-dc6c-47c8-8f35-3e009eb85212_794x572.png 848w, 
https://substackcdn.com/image/fetch/$s_!7crB!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea223c74-dc6c-47c8-8f35-3e009eb85212_794x572.png 1272w, https://substackcdn.com/image/fetch/$s_!7crB!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea223c74-dc6c-47c8-8f35-3e009eb85212_794x572.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!7crB!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea223c74-dc6c-47c8-8f35-3e009eb85212_794x572.png" width="794" height="572" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ea223c74-dc6c-47c8-8f35-3e009eb85212_794x572.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:572,&quot;width&quot;:794,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:26367,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178770843?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea223c74-dc6c-47c8-8f35-3e009eb85212_794x572.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!7crB!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea223c74-dc6c-47c8-8f35-3e009eb85212_794x572.png 424w, https://substackcdn.com/image/fetch/$s_!7crB!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea223c74-dc6c-47c8-8f35-3e009eb85212_794x572.png 848w, 
https://substackcdn.com/image/fetch/$s_!7crB!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea223c74-dc6c-47c8-8f35-3e009eb85212_794x572.png 1272w, https://substackcdn.com/image/fetch/$s_!7crB!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fea223c74-dc6c-47c8-8f35-3e009eb85212_794x572.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2> </h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" 
href="https://substackcdn.com/image/fetch/$s_!tPhT!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F887ce21a-dd38-4ec3-a7a1-3af11aff5dc1_876x429.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!tPhT!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F887ce21a-dd38-4ec3-a7a1-3af11aff5dc1_876x429.png 424w, https://substackcdn.com/image/fetch/$s_!tPhT!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F887ce21a-dd38-4ec3-a7a1-3af11aff5dc1_876x429.png 848w, https://substackcdn.com/image/fetch/$s_!tPhT!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F887ce21a-dd38-4ec3-a7a1-3af11aff5dc1_876x429.png 1272w, https://substackcdn.com/image/fetch/$s_!tPhT!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F887ce21a-dd38-4ec3-a7a1-3af11aff5dc1_876x429.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!tPhT!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F887ce21a-dd38-4ec3-a7a1-3af11aff5dc1_876x429.png" width="876" height="429" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/887ce21a-dd38-4ec3-a7a1-3af11aff5dc1_876x429.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:429,&quot;width&quot;:876,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;NA&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="NA" title="NA" srcset="https://substackcdn.com/image/fetch/$s_!tPhT!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F887ce21a-dd38-4ec3-a7a1-3af11aff5dc1_876x429.png 424w, https://substackcdn.com/image/fetch/$s_!tPhT!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F887ce21a-dd38-4ec3-a7a1-3af11aff5dc1_876x429.png 848w, https://substackcdn.com/image/fetch/$s_!tPhT!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F887ce21a-dd38-4ec3-a7a1-3af11aff5dc1_876x429.png 1272w, https://substackcdn.com/image/fetch/$s_!tPhT!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F887ce21a-dd38-4ec3-a7a1-3af11aff5dc1_876x429.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!WROF!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60d02bff-88ba-4c38-992d-fd5d2438c1dc_870x529.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!WROF!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60d02bff-88ba-4c38-992d-fd5d2438c1dc_870x529.png 424w, https://substackcdn.com/image/fetch/$s_!WROF!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60d02bff-88ba-4c38-992d-fd5d2438c1dc_870x529.png 848w, 
https://substackcdn.com/image/fetch/$s_!WROF!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60d02bff-88ba-4c38-992d-fd5d2438c1dc_870x529.png 1272w, https://substackcdn.com/image/fetch/$s_!WROF!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60d02bff-88ba-4c38-992d-fd5d2438c1dc_870x529.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!WROF!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60d02bff-88ba-4c38-992d-fd5d2438c1dc_870x529.png" width="870" height="529" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/60d02bff-88ba-4c38-992d-fd5d2438c1dc_870x529.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:529,&quot;width&quot;:870,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;NA&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="NA" title="NA" srcset="https://substackcdn.com/image/fetch/$s_!WROF!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60d02bff-88ba-4c38-992d-fd5d2438c1dc_870x529.png 424w, https://substackcdn.com/image/fetch/$s_!WROF!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60d02bff-88ba-4c38-992d-fd5d2438c1dc_870x529.png 848w, 
https://substackcdn.com/image/fetch/$s_!WROF!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60d02bff-88ba-4c38-992d-fd5d2438c1dc_870x529.png 1272w, https://substackcdn.com/image/fetch/$s_!WROF!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60d02bff-88ba-4c38-992d-fd5d2438c1dc_870x529.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2>Search performance of Consensus</h2><p>All this is very nice. But at the end of the day, we should care mostly about retrieval. 
How well does it work?</p><p>I generally run a couple of quick and dirty tests (see <a href="https://katinamagazine.org/content/article/reviews/2025/deep-dive-into-three-ai-academic-search-tools">this to get a feel for how I test quickly</a>) to get a feel for how well the search works, and Consensus in Deep Search mode aced my &#8220;easy&#8221;, &#8220;medium&#8221; and &#8220;hard&#8221; challenges.</p><p>This is expected for Deep Search tools but it is always good to confirm. </p><h2>Hallucination check</h2><p>In particular, it aced my &#8220;negative rejection&#8221; test <a href="https://doi.org/10.48550/arXiv.2309.01431">(Chen et al., 2023)</a>. </p><p>This involves posing a question where no relevant literature exists and seeing whether the system:</p><ul><li><p>sensibly refuses to answer</p></li><li><p>hallucinates an answer with fake citations.</p></li></ul><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!ZVVs!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14af86a6-8c9a-40c2-9ba0-9dc6225a81ec_822x431.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!ZVVs!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14af86a6-8c9a-40c2-9ba0-9dc6225a81ec_822x431.png 424w, https://substackcdn.com/image/fetch/$s_!ZVVs!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14af86a6-8c9a-40c2-9ba0-9dc6225a81ec_822x431.png 848w, https://substackcdn.com/image/fetch/$s_!ZVVs!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14af86a6-8c9a-40c2-9ba0-9dc6225a81ec_822x431.png 1272w, 
https://substackcdn.com/image/fetch/$s_!ZVVs!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14af86a6-8c9a-40c2-9ba0-9dc6225a81ec_822x431.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!ZVVs!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14af86a6-8c9a-40c2-9ba0-9dc6225a81ec_822x431.png" width="822" height="431" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/14af86a6-8c9a-40c2-9ba0-9dc6225a81ec_822x431.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:431,&quot;width&quot;:822,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:59575,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178770843?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14af86a6-8c9a-40c2-9ba0-9dc6225a81ec_822x431.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!ZVVs!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14af86a6-8c9a-40c2-9ba0-9dc6225a81ec_822x431.png 424w, https://substackcdn.com/image/fetch/$s_!ZVVs!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14af86a6-8c9a-40c2-9ba0-9dc6225a81ec_822x431.png 848w, 
https://substackcdn.com/image/fetch/$s_!ZVVs!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14af86a6-8c9a-40c2-9ba0-9dc6225a81ec_822x431.png 1272w, https://substackcdn.com/image/fetch/$s_!ZVVs!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F14af86a6-8c9a-40c2-9ba0-9dc6225a81ec_822x431.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p><a 
href="https://help.consensus.app/en/articles/10046838-responsible-ai-limitations#:~:text=regarding%20your%20question.-,Hallucinations%20can%20occur,-Hallucinations%20are%20a">Consensus claims to be immune to hallucinations that involve </a><strong><a href="https://help.consensus.app/en/articles/10046838-responsible-ai-limitations#:~:text=regarding%20your%20question.-,Hallucinations%20can%20occur,-Hallucinations%20are%20a">non-existent references</a></strong>, and not to answer from &#8220;internal memory&#8221; without sources. In my testing, it did indeed refuse where it should.</p><p>But it might still &#8220;misread sources&#8221;, or fail on what some papers call &#8220;source faithfulness&#8221;.</p><p>Don&#8217;t be too impressed though; most properly implemented academic RAG systems with additional checks can easily guarantee the first (just check if generated cited references match what is in the index using non-LLM methods), and often the second. It is the third type of hallucination (misreading sources) that is always the issue.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!UcUx!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F730ef341-0e11-4ed3-b5a2-f2782a142a47_984x440.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!UcUx!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F730ef341-0e11-4ed3-b5a2-f2782a142a47_984x440.png 424w, https://substackcdn.com/image/fetch/$s_!UcUx!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F730ef341-0e11-4ed3-b5a2-f2782a142a47_984x440.png 848w, 
https://substackcdn.com/image/fetch/$s_!UcUx!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F730ef341-0e11-4ed3-b5a2-f2782a142a47_984x440.png 1272w, https://substackcdn.com/image/fetch/$s_!UcUx!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F730ef341-0e11-4ed3-b5a2-f2782a142a47_984x440.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!UcUx!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F730ef341-0e11-4ed3-b5a2-f2782a142a47_984x440.png" width="984" height="440" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/730ef341-0e11-4ed3-b5a2-f2782a142a47_984x440.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:440,&quot;width&quot;:984,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:51939,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178770843?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F730ef341-0e11-4ed3-b5a2-f2782a142a47_984x440.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!UcUx!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F730ef341-0e11-4ed3-b5a2-f2782a142a47_984x440.png 424w, 
https://substackcdn.com/image/fetch/$s_!UcUx!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F730ef341-0e11-4ed3-b5a2-f2782a142a47_984x440.png 848w, https://substackcdn.com/image/fetch/$s_!UcUx!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F730ef341-0e11-4ed3-b5a2-f2782a142a47_984x440.png 1272w, https://substackcdn.com/image/fetch/$s_!UcUx!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F730ef341-0e11-4ed3-b5a2-f2782a142a47_984x440.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Deep Search tools are so good now that they easily ace my tests, but my rough estimation/vibe sense currently is that the Consensus Deep Search is at least decent (maybe in the top quartile of tools I have tried), though it is unclear how it stacks up against my favourite tool, Undermind.ai, which is generally ranked at the top of the table in many properly and not so properly done head-to-head tests and/or is praised by evidence synthesis experts I know.</p><p></p><h2>Conclusion</h2><p>Consensus is, in my view, likely one of the top tools in its class.</p><p>First and most importantly, the recent addition of Deep Search mode makes the retrieval capabilities of Consensus competitive with some of the most powerful search tools.</p><p>On top of that, it has in my view one of the most appealing interfaces out there, with color-coded references, and the Consensus Meter, for all its methodological faults, is likely to appeal to undergraduates and less advanced users - allowing them to get a quick scan of the literature. Add advanced pre-filters and LibKey integration to institutional full-text, and it is easy to guess this will be a hit for many users doing narrative literature reviews.</p><p>Still, I have some misgivings over how STEM-centric some parts of Consensus are; for example, there&#8217;s its use of SciScore, the details extracted for study snapshots, etc. While the sources are broad enough, one wonders if the tool works better (e.g. retrieval and ranking algo is tuned) for STEM subjects.</p><p>Overall, while there are perhaps more powerful and specialized tools like Undermind.ai or Elicit.com, this is a great tool that I can recommend institutions consider.</p><p><a href="https://aarontay.substack.com/about#&#167;disclosure-and-independence-policy">My Disclosure &amp; Independence Policy</a></p><h2>Bonus: Comparison: Consensus vs. 
Undermind.ai</h2><p>Since SMU Libraries currently subscribes to both tools, it would be good to do a comparison. Do note that I have a lot more experience with Undermind.ai and the purpose of this piece isn&#8217;t to do a formal comparison review.</p><h3>Similarities</h3><ul><li><p>Both search approximately the same open sources (OpenAlex, Semantic Scholar) using a mix of lexical, semantic and even citation search (in Consensus Deep mode).</p></li><li><p>Both take &lt;10 minutes for deep research runs (Undermind takes slightly longer)</p></li><li><p>Both generate comprehensive reports and interesting visualizations with citations</p></li><li><p>Both use sophisticated LLM-based summarization and extraction</p></li></ul><p></p><h3>Key Differences between Consensus and Undermind </h3><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!RbeZ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2377ce02-82a1-4061-b50e-082ba2297ffd_561x741.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!RbeZ!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2377ce02-82a1-4061-b50e-082ba2297ffd_561x741.png 424w, https://substackcdn.com/image/fetch/$s_!RbeZ!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2377ce02-82a1-4061-b50e-082ba2297ffd_561x741.png 848w, https://substackcdn.com/image/fetch/$s_!RbeZ!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2377ce02-82a1-4061-b50e-082ba2297ffd_561x741.png 1272w, 
https://substackcdn.com/image/fetch/$s_!RbeZ!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2377ce02-82a1-4061-b50e-082ba2297ffd_561x741.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!RbeZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2377ce02-82a1-4061-b50e-082ba2297ffd_561x741.png" width="561" height="741" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/2377ce02-82a1-4061-b50e-082ba2297ffd_561x741.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:741,&quot;width&quot;:561,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:43946,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178770843?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2377ce02-82a1-4061-b50e-082ba2297ffd_561x741.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!RbeZ!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2377ce02-82a1-4061-b50e-082ba2297ffd_561x741.png 424w, https://substackcdn.com/image/fetch/$s_!RbeZ!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2377ce02-82a1-4061-b50e-082ba2297ffd_561x741.png 848w, https://substackcdn.com/image/fetch/$s_!RbeZ!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2377ce02-82a1-4061-b50e-082ba2297ffd_561x741.png 1272w, 
https://substackcdn.com/image/fetch/$s_!RbeZ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F2377ce02-82a1-4061-b50e-082ba2297ffd_561x741.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>I had initially planned an in-depth comparison of Undermind vs Consensus, but it ran too long and makes little sense if you are not already familiar with Undermind.ai.</p><p>Still, here&#8217;s how I see how the two differ.</p><p><strong>Layout Format Differences</strong></p><p>One of the most noticeable differences between Consensus and Undermind is their 
report format. Consensus generates long-form prose reports with extensive tables and visualizations that can theoretically be copied directly into a document.</p><p>Undermind, by contrast, diverges from the usual Deep Research outputs and produces more informal reports organized in bullet points across standard sections.</p><p>There&#8217;s usually an initial summary section, then sections titled</p><ul><li><p>Categories</p></li><li><p>Timeline</p></li><li><p>Foundational Work</p></li><li><p>Adjacent Work  (work that cites foundational work a lot but Undermind determines is not semantically what you want - read to get broader view).</p></li></ul><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!ej3w!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F55463281-2a71-4266-9aac-a3f6995e0979_538x829.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!ej3w!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F55463281-2a71-4266-9aac-a3f6995e0979_538x829.png 424w, https://substackcdn.com/image/fetch/$s_!ej3w!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F55463281-2a71-4266-9aac-a3f6995e0979_538x829.png 848w, https://substackcdn.com/image/fetch/$s_!ej3w!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F55463281-2a71-4266-9aac-a3f6995e0979_538x829.png 1272w, https://substackcdn.com/image/fetch/$s_!ej3w!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F55463281-2a71-4266-9aac-a3f6995e0979_538x829.png 1456w" 
sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!ej3w!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F55463281-2a71-4266-9aac-a3f6995e0979_538x829.png" width="538" height="829" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/55463281-2a71-4266-9aac-a3f6995e0979_538x829.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:829,&quot;width&quot;:538,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:55382,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178770843?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F55463281-2a71-4266-9aac-a3f6995e0979_538x829.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!ej3w!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F55463281-2a71-4266-9aac-a3f6995e0979_538x829.png 424w, https://substackcdn.com/image/fetch/$s_!ej3w!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F55463281-2a71-4266-9aac-a3f6995e0979_538x829.png 848w, https://substackcdn.com/image/fetch/$s_!ej3w!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F55463281-2a71-4266-9aac-a3f6995e0979_538x829.png 1272w, https://substackcdn.com/image/fetch/$s_!ej3w!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F55463281-2a71-4266-9aac-a3f6995e0979_538x829.png 1456w" 
sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p> </p><p><a href="https://app.undermind.ai/report/7b268fa2277b49f6ec45c689fcd1f43a48ba88db48b43134c58804dda396e10e">Here&#8217;s an example</a> with some sections expanded. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!fDga!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffda9cdfc-b02c-43d6-b0f7-e052bf024b29_725x733.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!fDga!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffda9cdfc-b02c-43d6-b0f7-e052bf024b29_725x733.png 424w, https://substackcdn.com/image/fetch/$s_!fDga!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffda9cdfc-b02c-43d6-b0f7-e052bf024b29_725x733.png 848w, https://substackcdn.com/image/fetch/$s_!fDga!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffda9cdfc-b02c-43d6-b0f7-e052bf024b29_725x733.png 1272w, https://substackcdn.com/image/fetch/$s_!fDga!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffda9cdfc-b02c-43d6-b0f7-e052bf024b29_725x733.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!fDga!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffda9cdfc-b02c-43d6-b0f7-e052bf024b29_725x733.png" width="725" height="733" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/fda9cdfc-b02c-43d6-b0f7-e052bf024b29_725x733.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:733,&quot;width&quot;:725,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!fDga!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffda9cdfc-b02c-43d6-b0f7-e052bf024b29_725x733.png 424w, https://substackcdn.com/image/fetch/$s_!fDga!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffda9cdfc-b02c-43d6-b0f7-e052bf024b29_725x733.png 848w, https://substackcdn.com/image/fetch/$s_!fDga!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffda9cdfc-b02c-43d6-b0f7-e052bf024b29_725x733.png 1272w, https://substackcdn.com/image/fetch/$s_!fDga!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffda9cdfc-b02c-43d6-b0f7-e052bf024b29_725x733.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!go4Y!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ebc70c5-6bfe-4815-ad72-8c5e2daa8458_532x523.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!go4Y!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ebc70c5-6bfe-4815-ad72-8c5e2daa8458_532x523.png 424w, https://substackcdn.com/image/fetch/$s_!go4Y!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ebc70c5-6bfe-4815-ad72-8c5e2daa8458_532x523.png 848w, 
https://substackcdn.com/image/fetch/$s_!go4Y!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ebc70c5-6bfe-4815-ad72-8c5e2daa8458_532x523.png 1272w, https://substackcdn.com/image/fetch/$s_!go4Y!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ebc70c5-6bfe-4815-ad72-8c5e2daa8458_532x523.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!go4Y!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ebc70c5-6bfe-4815-ad72-8c5e2daa8458_532x523.png" width="532" height="523" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/1ebc70c5-6bfe-4815-ad72-8c5e2daa8458_532x523.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:523,&quot;width&quot;:532,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:31841,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:&quot;&quot;,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178770843?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ebc70c5-6bfe-4815-ad72-8c5e2daa8458_532x523.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!go4Y!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ebc70c5-6bfe-4815-ad72-8c5e2daa8458_532x523.png 424w, 
https://substackcdn.com/image/fetch/$s_!go4Y!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ebc70c5-6bfe-4815-ad72-8c5e2daa8458_532x523.png 848w, https://substackcdn.com/image/fetch/$s_!go4Y!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ebc70c5-6bfe-4815-ad72-8c5e2daa8458_532x523.png 1272w, https://substackcdn.com/image/fetch/$s_!go4Y!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1ebc70c5-6bfe-4815-ad72-8c5e2daa8458_532x523.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Besides the standard sections in Undermind, the subsections under them are more variable but typically you will see coverage of areas like &#8220;research gap&#8221;, &#8220;cluster of top authors&#8221; etc., pretty much what you see in Scopus AI, Consensus Deep Search etc.</p><p>That said, Consensus provides substantially more built-in visualizations. In fact, the one major visualization you can see in Undermind is the timeline visualization and the rest are tables at best.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!gcC1!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36257f1-f07b-4c62-a0e8-5b51721e8248_1542x805.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!gcC1!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36257f1-f07b-4c62-a0e8-5b51721e8248_1542x805.png 424w, https://substackcdn.com/image/fetch/$s_!gcC1!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36257f1-f07b-4c62-a0e8-5b51721e8248_1542x805.png 848w, https://substackcdn.com/image/fetch/$s_!gcC1!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36257f1-f07b-4c62-a0e8-5b51721e8248_1542x805.png 1272w, https://substackcdn.com/image/fetch/$s_!gcC1!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36257f1-f07b-4c62-a0e8-5b51721e8248_1542x805.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!gcC1!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36257f1-f07b-4c62-a0e8-5b51721e8248_1542x805.png" width="1456" height="760" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/b36257f1-f07b-4c62-a0e8-5b51721e8248_1542x805.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:760,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!gcC1!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36257f1-f07b-4c62-a0e8-5b51721e8248_1542x805.png 424w, https://substackcdn.com/image/fetch/$s_!gcC1!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36257f1-f07b-4c62-a0e8-5b51721e8248_1542x805.png 848w, https://substackcdn.com/image/fetch/$s_!gcC1!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36257f1-f07b-4c62-a0e8-5b51721e8248_1542x805.png 1272w, https://substackcdn.com/image/fetch/$s_!gcC1!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fb36257f1-f07b-4c62-a0e8-5b51721e8248_1542x805.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft 
icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>But what about sections you want but Undermind doesn&#8217;t generate? Undermind covers this with a &#8220;Chat with Expert&#8221; feature. This functionality allows users to interact with all the papers found using a frontier thinking model (the specific LLM is not disclosed). 
</p><blockquote><p>Most other similar tools like Consensus, SciSpace offer &#8220;chat with paper&#8221; but this only interacts with one or at best a few papers.</p></blockquote><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!87Vd!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9228f52f-9815-4d59-ab44-497f36702d5c_694x436.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!87Vd!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9228f52f-9815-4d59-ab44-497f36702d5c_694x436.png 424w, https://substackcdn.com/image/fetch/$s_!87Vd!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9228f52f-9815-4d59-ab44-497f36702d5c_694x436.png 848w, https://substackcdn.com/image/fetch/$s_!87Vd!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9228f52f-9815-4d59-ab44-497f36702d5c_694x436.png 1272w, https://substackcdn.com/image/fetch/$s_!87Vd!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9228f52f-9815-4d59-ab44-497f36702d5c_694x436.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!87Vd!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9228f52f-9815-4d59-ab44-497f36702d5c_694x436.png" width="694" height="436" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/9228f52f-9815-4d59-ab44-497f36702d5c_694x436.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:436,&quot;width&quot;:694,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!87Vd!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9228f52f-9815-4d59-ab44-497f36702d5c_694x436.png 424w, https://substackcdn.com/image/fetch/$s_!87Vd!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9228f52f-9815-4d59-ab44-497f36702d5c_694x436.png 848w, https://substackcdn.com/image/fetch/$s_!87Vd!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9228f52f-9815-4d59-ab44-497f36702d5c_694x436.png 1272w, https://substackcdn.com/image/fetch/$s_!87Vd!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F9228f52f-9815-4d59-ab44-497f36702d5c_694x436.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>You can type in your own prompt but by default it includes nine prompts that are surely well-engineered to work effectively with Undermind, and in my experience, these prompts can generate outputs matching or exceeding what Consensus produces automatically, including equivalents to Consensus&#8217;s &#8220;Claims and Evidence Table.&#8221; </p><p>This is what you might get when you ask to compare top findings.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!MQFM!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F27e0b472-33c0-4469-a9dc-448897710657_1766x772.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" 
srcset="https://substackcdn.com/image/fetch/$s_!MQFM!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F27e0b472-33c0-4469-a9dc-448897710657_1766x772.png 424w, https://substackcdn.com/image/fetch/$s_!MQFM!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F27e0b472-33c0-4469-a9dc-448897710657_1766x772.png 848w, https://substackcdn.com/image/fetch/$s_!MQFM!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F27e0b472-33c0-4469-a9dc-448897710657_1766x772.png 1272w, https://substackcdn.com/image/fetch/$s_!MQFM!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F27e0b472-33c0-4469-a9dc-448897710657_1766x772.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!MQFM!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F27e0b472-33c0-4469-a9dc-448897710657_1766x772.png" width="1456" height="636" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/27e0b472-33c0-4469-a9dc-448897710657_1766x772.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:636,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:100422,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/178770843?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F27e0b472-33c0-4469-a9dc-448897710657_1766x772.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" 
class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!MQFM!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F27e0b472-33c0-4469-a9dc-448897710657_1766x772.png 424w, https://substackcdn.com/image/fetch/$s_!MQFM!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F27e0b472-33c0-4469-a9dc-448897710657_1766x772.png 848w, https://substackcdn.com/image/fetch/$s_!MQFM!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F27e0b472-33c0-4469-a9dc-448897710657_1766x772.png 1272w, https://substackcdn.com/image/fetch/$s_!MQFM!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F27e0b472-33c0-4469-a9dc-448897710657_1766x772.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" 
stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Interestingly, earlier versions of this feature would independently search the web when using default prompts to supplement academic sources with government reports and policy documents. It almost never does this now,<em> but you can turn this on by explicitly adding &#8220;Search the web&#8221; to the default prompts.</em>  As you can see below, the LLM is searching the general web for general US policy on open access.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!KrSW!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf2e137d-2480-488b-a0aa-2491abcbfa14_884x684.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!KrSW!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf2e137d-2480-488b-a0aa-2491abcbfa14_884x684.png 424w, https://substackcdn.com/image/fetch/$s_!KrSW!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf2e137d-2480-488b-a0aa-2491abcbfa14_884x684.png 848w, https://substackcdn.com/image/fetch/$s_!KrSW!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf2e137d-2480-488b-a0aa-2491abcbfa14_884x684.png 1272w, 
https://substackcdn.com/image/fetch/$s_!KrSW!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf2e137d-2480-488b-a0aa-2491abcbfa14_884x684.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!KrSW!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf2e137d-2480-488b-a0aa-2491abcbfa14_884x684.png" width="884" height="684" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/df2e137d-2480-488b-a0aa-2491abcbfa14_884x684.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:684,&quot;width&quot;:884,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!KrSW!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf2e137d-2480-488b-a0aa-2491abcbfa14_884x684.png 424w, https://substackcdn.com/image/fetch/$s_!KrSW!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf2e137d-2480-488b-a0aa-2491abcbfa14_884x684.png 848w, https://substackcdn.com/image/fetch/$s_!KrSW!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf2e137d-2480-488b-a0aa-2491abcbfa14_884x684.png 1272w, 
https://substackcdn.com/image/fetch/$s_!KrSW!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdf2e137d-2480-488b-a0aa-2491abcbfa14_884x684.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>When activated, it can cite both academic references and current policy documents, providing a broader evidence base than purely academic sources.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" 
href="https://substackcdn.com/image/fetch/$s_!jGPy!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F105bbe03-b90f-4be0-b4b8-7edf49834163_982x581.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!jGPy!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F105bbe03-b90f-4be0-b4b8-7edf49834163_982x581.png 424w, https://substackcdn.com/image/fetch/$s_!jGPy!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F105bbe03-b90f-4be0-b4b8-7edf49834163_982x581.png 848w, https://substackcdn.com/image/fetch/$s_!jGPy!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F105bbe03-b90f-4be0-b4b8-7edf49834163_982x581.png 1272w, https://substackcdn.com/image/fetch/$s_!jGPy!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F105bbe03-b90f-4be0-b4b8-7edf49834163_982x581.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!jGPy!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F105bbe03-b90f-4be0-b4b8-7edf49834163_982x581.png" width="982" height="581" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/105bbe03-b90f-4be0-b4b8-7edf49834163_982x581.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:581,&quot;width&quot;:982,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!jGPy!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F105bbe03-b90f-4be0-b4b8-7edf49834163_982x581.png 424w, https://substackcdn.com/image/fetch/$s_!jGPy!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F105bbe03-b90f-4be0-b4b8-7edf49834163_982x581.png 848w, https://substackcdn.com/image/fetch/$s_!jGPy!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F105bbe03-b90f-4be0-b4b8-7edf49834163_982x581.png 1272w, https://substackcdn.com/image/fetch/$s_!jGPy!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F105bbe03-b90f-4be0-b4b8-7edf49834163_982x581.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>As you can see above, the output cites the latest 2025 US policy (dated March 2025) and not just the academic references found earlier.</p><p><strong>User Visualizations and Interface</strong></p><p>From a user experience perspective, Consensus appears more accessible to less advanced users. The Consensus Meter, despite its methodological limitations, provides an intuitive visualization that appeals to many users. The color-coding of citations makes it easy to see at a glance which papers support different conclusions, and the built-in visualizations require no additional prompting or effort. Small but practical features like LibKey integration for accessing full-text articles are particularly valuable for undergraduate students who may not have established workflows for accessing institutional subscriptions.</p><p><strong>Undermind has more advanced search capabilities </strong></p><p>Despite these user-friendly features, I personally prefer Undermind, primarily for its search capabilities. 
While Undermind&#8217;s clarifying questions before conducting searches can sometimes feel tiresome, they prove extremely helpful when exploring unfamiliar research areas&#8212;which represents the most common use case for these tools. </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!WHgP!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4670bcf8-52bc-444a-9ab2-fe2338cb8a0c_841x756.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!WHgP!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4670bcf8-52bc-444a-9ab2-fe2338cb8a0c_841x756.png 424w, https://substackcdn.com/image/fetch/$s_!WHgP!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4670bcf8-52bc-444a-9ab2-fe2338cb8a0c_841x756.png 848w, https://substackcdn.com/image/fetch/$s_!WHgP!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4670bcf8-52bc-444a-9ab2-fe2338cb8a0c_841x756.png 1272w, https://substackcdn.com/image/fetch/$s_!WHgP!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4670bcf8-52bc-444a-9ab2-fe2338cb8a0c_841x756.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!WHgP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4670bcf8-52bc-444a-9ab2-fe2338cb8a0c_841x756.png" width="841" height="756" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4670bcf8-52bc-444a-9ab2-fe2338cb8a0c_841x756.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:756,&quot;width&quot;:841,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!WHgP!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4670bcf8-52bc-444a-9ab2-fe2338cb8a0c_841x756.png 424w, https://substackcdn.com/image/fetch/$s_!WHgP!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4670bcf8-52bc-444a-9ab2-fe2338cb8a0c_841x756.png 848w, https://substackcdn.com/image/fetch/$s_!WHgP!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4670bcf8-52bc-444a-9ab2-fe2338cb8a0c_841x756.png 1272w, https://substackcdn.com/image/fetch/$s_!WHgP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F4670bcf8-52bc-444a-9ab2-fe2338cb8a0c_841x756.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>There are hints that Undermind employs a more sophisticated search system: it evaluates approximately 150 results on average compared to Consensus&#8217;s maximum of 50, and it can search even deeper when requested. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!0_z6!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde788bc9-12ed-46bb-a00e-a6e429de779e_635x249.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!0_z6!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde788bc9-12ed-46bb-a00e-a6e429de779e_635x249.png 424w, https://substackcdn.com/image/fetch/$s_!0_z6!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde788bc9-12ed-46bb-a00e-a6e429de779e_635x249.png 848w, https://substackcdn.com/image/fetch/$s_!0_z6!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde788bc9-12ed-46bb-a00e-a6e429de779e_635x249.png 1272w, https://substackcdn.com/image/fetch/$s_!0_z6!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde788bc9-12ed-46bb-a00e-a6e429de779e_635x249.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!0_z6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde788bc9-12ed-46bb-a00e-a6e429de779e_635x249.png" width="635" height="249" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/de788bc9-12ed-46bb-a00e-a6e429de779e_635x249.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:249,&quot;width&quot;:635,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!0_z6!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde788bc9-12ed-46bb-a00e-a6e429de779e_635x249.png 424w, https://substackcdn.com/image/fetch/$s_!0_z6!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde788bc9-12ed-46bb-a00e-a6e429de779e_635x249.png 848w, https://substackcdn.com/image/fetch/$s_!0_z6!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde788bc9-12ed-46bb-a00e-a6e429de779e_635x249.png 1272w, https://substackcdn.com/image/fetch/$s_!0_z6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde788bc9-12ed-46bb-a00e-a6e429de779e_635x249.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Undermind also provides a statistical analysis estimating how much relevant literature might remain undiscovered, though this feature lacks independent validation. 
</p><p>Another valuable feature is Undermind&#8217;s search alerts based on created reports, which the author finds extremely high-quality and useful, including &#8220;adjacent&#8221; alerts that surface related but not directly requested content&#8212;something Consensus doesn&#8217;t currently offer.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!W4II!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F53794818-f145-4a78-bb8d-e66a41b37f28_1415x893.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!W4II!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F53794818-f145-4a78-bb8d-e66a41b37f28_1415x893.png 424w, https://substackcdn.com/image/fetch/$s_!W4II!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F53794818-f145-4a78-bb8d-e66a41b37f28_1415x893.png 848w, https://substackcdn.com/image/fetch/$s_!W4II!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F53794818-f145-4a78-bb8d-e66a41b37f28_1415x893.png 1272w, https://substackcdn.com/image/fetch/$s_!W4II!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F53794818-f145-4a78-bb8d-e66a41b37f28_1415x893.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!W4II!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F53794818-f145-4a78-bb8d-e66a41b37f28_1415x893.png" width="1415" height="893" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/53794818-f145-4a78-bb8d-e66a41b37f28_1415x893.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:893,&quot;width&quot;:1415,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!W4II!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F53794818-f145-4a78-bb8d-e66a41b37f28_1415x893.png 424w, https://substackcdn.com/image/fetch/$s_!W4II!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F53794818-f145-4a78-bb8d-e66a41b37f28_1415x893.png 848w, https://substackcdn.com/image/fetch/$s_!W4II!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F53794818-f145-4a78-bb8d-e66a41b37f28_1415x893.png 1272w, https://substackcdn.com/image/fetch/$s_!W4II!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F53794818-f145-4a78-bb8d-e66a41b37f28_1415x893.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The one search-related area where Consensus maintains a clear advantage is its extensive pre-filtering options, allowing users to exclude preprints or filter by journal quality thresholds before conducting searches.</p><h2>Conclusion</h2><p>For my typical use case&#8212;<a href="https://aarontay.substack.com/p/what-academic-deep-research-is-really">quickly getting the lay of the land rather than producing ready-to-use literature review text</a>&#8212;both tools work well, though I have a slight preference for Undermind&#8217;s bullet-point format for easier skimming. 
</p><p>Both are excellent tools - typically mentioned in the same breath as Elicit.com. I suspect the choice between tools ultimately depends on the user&#8217;s sophistication and whether one prioritizes accessible visualizations or deeper search capabilities - with Consensus being easier to appreciate for undergraduates and less advanced users, while advanced users would appreciate the deeper search capabilities of Undermind.ai.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div>]]></content:encoded></item><item><title><![CDATA[ResearchRabbit’s 2025 Revamp: iterative chaining without the clutter]]></title><description><![CDATA[ResearchRabbit shipped its biggest update in years: a cleaner iterative &#8220;rabbit hole&#8221; flow, a more configurable citation graph, and an optional premium tier. The company now &#8220;partners&#8221; with Litmaps, which shows up in features and business model]]></description><link>https://aarontay.substack.com/p/researchrabbits-2025-revamp-iterative</link><guid isPermaLink="false">https://aarontay.substack.com/p/researchrabbits-2025-revamp-iterative</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Sun, 02 Nov 2025 13:11:28 GMT</pubDate><enclosure 
url="https://substackcdn.com/image/youtube/w_728,c_limit/St4C-QdU-Ro" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div id="youtube2-St4C-QdU-Ro" class="youtube-wrap" data-attrs="{&quot;videoId&quot;:&quot;St4C-QdU-Ro&quot;,&quot;startTime&quot;:null,&quot;endTime&quot;:null}" data-component-name="Youtube2ToDOM"><div class="youtube-inner"><iframe src="https://www.youtube-nocookie.com/embed/St4C-QdU-Ro?rel=0&amp;autoplay=0&amp;showinfo=0&amp;enablejsapi=0" frameborder="0" loading="lazy" gesture="media" allow="autoplay; fullscreen" allowautoplay="true" allowfullscreen="true" width="728" height="409"></iframe></div></div><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me Coffee! (via ko-fi)&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me Coffee! (via ko-fi)</span></a></p><p><strong>TL;DR  </strong></p><ul><li><p>ResearchRabbit shipped its biggest update in years: a cleaner iterative &#8220;rabbit hole&#8221; flow, a more configurable citation graph, and an optional premium tier.</p></li><li><p>The company now &#8220;<strong>partners&#8221; with Litmaps (others are reporting it as <a href="https://www.scoop.co.nz/stories/BU2505/S00127/nz-startup-litmaps-acquires-us-rival-and-raises-1m-to-accelerate-ai-driven-research-worldwide.htm">acquired</a>)</strong>, which shows up in features and business model.</p></li><li><p>Free tier limits each search to <strong>&lt;50 input papers / &lt;5 authors</strong> and one project; RR+ removes those caps and unlocks unlimited advanced searches and exports.</p></li><li><p>For librarians and researchers: IMHO RR is now a user-friendly entry to <strong>iterative citation chaining</strong>; Litmaps still leads on <strong>advanced visualization/filters methods</strong>; Connected Papers remains the <strong>fastest and easiest to use 
&#8220;single-seed&#8221; map</strong>.</p></li></ul><p></p><p><strong>Introduction</strong></p><p>ResearchRabbit belongs to a category of tools I call <a href="https://musingsaboutlibrarianship.blogspot.com/2022/08/citation-based-literature-mapping-tools.html">&#8220;citation-based literature mapping.&#8221;</a> This group includes <a href="https://www.citationgecko.com/">Citation Gecko</a>, <a href="https://www.connectedpapers.com/">Connected Papers</a>, <a href="https://researchrabbitapp.com/">ResearchRabbit</a>, <a href="https://inciteful.xyz/">Inciteful</a>, <a href="https://www.litmaps.com/">Litmaps</a> and <a href="https://musingsaboutlibrarianship.blogspot.com/p/list-of-innovative-literature-mapping.html">others</a>. Most of these tools, with the exception of the early pioneer Citation Gecko, only emerged in the early 2020s (prior to the ChatGPT craze).</p><p>These tools came from a variety of sources, from startups to open-source hobbyist projects by researchers. This explosion of ideas and tools became possible <a href="https://opencitations.wordpress.com/2021/10/27/coverage-of-open-citation-data-approaches-parity-with-web-of-science-and-scopus/">thanks to the availability of large-scale open academic metadata</a>&#8212;such as OpenAlex and the Semantic Scholar Corpus&#8212;under open licenses. 
These resources now rival or even exceed traditional citation indexes like Web of Science in coverage.</p><blockquote><p>Though, as I have noted, with <a href="https://aarontay.substack.com/p/the-petrol-tank-for-ai-discovery">content owners and publishers now cracking down on the use of abstracts due to their increased value for training by Big Tech companies</a>, things might be reversing.</p></blockquote><p>I use the term &#8220;<a href="https://musingsaboutlibrarianship.blogspot.com/2022/08/citation-based-literature-mapping-tools.html">citation-based literature mapping</a> services or tools&#8221; because, traditionally, most of these tools rely solely on citations for recommendations and clustering. They generally predate the post-2023 rise of &#8220;AI-powered search engines&#8221; and thus typically don&#8217;t employ Transformer-based LLM methods for recommendations. While some of the latest Litmaps features <em>do</em> incorporate generative AI to do semantic matching, this is a very recent development. </p><blockquote><p>It&#8217;s challenging to be 100% certain about their underlying algorithms, as tools are not always transparent on how they work. However, we do know that Litmaps utilizes &#8220;semantic search&#8221; (<a href="https://medium.com/litmaps/guide-to-litmaps-visualisations-95a9bc2cc9de">dense embedding search - SPECTER embeddings as of 2021</a>) for title-abstract similarity matching, and it&#8217;s probable the new ResearchRabbit does as well with the &#8220;similar&#8221; function.</p></blockquote><p>Among these tools, I&#8217;ve always considered ResearchRabbit one of the &#8220;big three,&#8221; alongside Connected Papers and Litmaps. While other similar offerings exist, most are hobbyist projects; these three appear the most ambitious, offering feature-rich interfaces and generally being the most well-known among users, including librarians. 
</p><p>ResearchRabbit particularly stood out for librarians to recommend because, despite its interface brimming with features (matched only by Litmaps), it didn&#8217;t offer a premium tier. </p><p>I&#8217;ve always wondered about how they would remain sustainable, and now we have an answer. <a href="https://www.researchrabbit.ai/announcement-researchrabbit-release-2025">On October 15, 2025, they announced that the new version of ResearchRabbit would include premium features</a>. Even more interestingly, they also revealed a partnership (reported as <a href="https://www.scoop.co.nz/stories/BU2505/S00127/nz-startup-litmaps-acquires-us-rival-and-raises-1m-to-accelerate-ai-driven-research-worldwide.htm">an acquisition by some</a>) with Litmaps!</p><p><a href="https://x.com/RsrchRabbit/status/1983825922131218668">On October 30, 2025, the new ResearchRabbit officially launched</a>. <br> </p><h2>What changed and what did not</h2><p><strong>Not changed</strong> - You enter &#8220;Seed Papers&#8221; which are used by ResearchRabbit to recommend papers.</p><p><strong>Changed - </strong>Besides using citations, references or authors of seed papers, you can use semantic similarity (likely based on title/abstract similarity embeddings like Litmaps).</p><p><strong>Changed - </strong>New Citation Map visualization with customizable X,Y Axis (similar to Litmaps).</p><p><strong>Changed</strong> - New, cleaner interface around the &#8220;Rabbit hole&#8221; metaphor.</p><h2>The new &#8220;Rabbit-hole&#8221; interface explained</h2><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!xD0C!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd34f803e-58e1-4219-8346-c873ed7e8c6c_433x122.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" 
srcset="https://substackcdn.com/image/fetch/$s_!xD0C!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd34f803e-58e1-4219-8346-c873ed7e8c6c_433x122.png 424w, https://substackcdn.com/image/fetch/$s_!xD0C!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd34f803e-58e1-4219-8346-c873ed7e8c6c_433x122.png 848w, https://substackcdn.com/image/fetch/$s_!xD0C!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd34f803e-58e1-4219-8346-c873ed7e8c6c_433x122.png 1272w, https://substackcdn.com/image/fetch/$s_!xD0C!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd34f803e-58e1-4219-8346-c873ed7e8c6c_433x122.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!xD0C!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd34f803e-58e1-4219-8346-c873ed7e8c6c_433x122.png" width="433" height="122" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/d34f803e-58e1-4219-8346-c873ed7e8c6c_433x122.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:122,&quot;width&quot;:433,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:12727,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd34f803e-58e1-4219-8346-c873ed7e8c6c_433x122.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!xD0C!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd34f803e-58e1-4219-8346-c873ed7e8c6c_433x122.png 424w, https://substackcdn.com/image/fetch/$s_!xD0C!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd34f803e-58e1-4219-8346-c873ed7e8c6c_433x122.png 848w, https://substackcdn.com/image/fetch/$s_!xD0C!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd34f803e-58e1-4219-8346-c873ed7e8c6c_433x122.png 1272w, https://substackcdn.com/image/fetch/$s_!xD0C!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd34f803e-58e1-4219-8346-c873ed7e8c6c_433x122.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p>The part that confused me the most about the new interface was this &#8220;Rabbit Hole&#8221; interface that appeared at the top of the interface. After a lot of experimentation, this is my understanding of how it works.</p><p>Think of ResearchRabbit&#8217;s &#8220;rabbit holes&#8221; as a tidy history of your search <strong>checkpoints</strong>. The tricky bit is to understand which actions create a &#8220;rabbit hole&#8221; checkpoint and which don&#8217;t.<br></p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! 
Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p>Here is how <em>I think of it.</em> Several moving parts matter: <strong>input set</strong>, <strong>mode</strong>, and <strong>iteration</strong>. These terms are my own invention.</p><h2>The three moving parts</h2><ul><li><p><strong>Collection</strong>: This is your folder of papers that persists across sessions. You can create multiple color-coded collections. Any seed papers or input papers you find during the session are not automatically added to your collection unless you explicitly add them.</p></li><li><p><strong>Seeds</strong>: the first few papers you use as the <strong>1st iteration of search</strong>. 
This can be from your collection, found via search or uploaded via CSV/BibTeX etc.</p></li><li><p><strong>Input set</strong>: the seeds plus any candidates you actively select during the process to guide the <em>next iterations of search</em>.</p></li><li><p><strong>Mode</strong>: the method you use to fetch candidates based on <strong>last iteration input papers</strong> for review:</p><ul><li><p><strong>Similar</strong> &#8212; based on semantic/title-abstract similarity of input papers</p></li><li><p><strong>References</strong> &#8212; based on backward links (papers the inputs cite)</p></li><li><p><strong>Citations</strong> &#8212; based on forward links (papers that cite the inputs)</p></li><li><p>There is <strong>author search</strong> but I rarely use it.</p></li><li><p>These actions <strong>do not</strong> create a &#8220;rabbit hole&#8221; checkpoint</p></li></ul></li></ul><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!H-6j!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60230654-74b5-41d9-baf0-e77e4a8bee1f_609x315.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!H-6j!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60230654-74b5-41d9-baf0-e77e4a8bee1f_609x315.png 424w, https://substackcdn.com/image/fetch/$s_!H-6j!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60230654-74b5-41d9-baf0-e77e4a8bee1f_609x315.png 848w, https://substackcdn.com/image/fetch/$s_!H-6j!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60230654-74b5-41d9-baf0-e77e4a8bee1f_609x315.png 1272w, 
https://substackcdn.com/image/fetch/$s_!H-6j!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60230654-74b5-41d9-baf0-e77e4a8bee1f_609x315.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!H-6j!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60230654-74b5-41d9-baf0-e77e4a8bee1f_609x315.png" width="609" height="315" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/60230654-74b5-41d9-baf0-e77e4a8bee1f_609x315.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:315,&quot;width&quot;:609,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:65477,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60230654-74b5-41d9-baf0-e77e4a8bee1f_609x315.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!H-6j!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60230654-74b5-41d9-baf0-e77e4a8bee1f_609x315.png 424w, https://substackcdn.com/image/fetch/$s_!H-6j!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60230654-74b5-41d9-baf0-e77e4a8bee1f_609x315.png 848w, 
https://substackcdn.com/image/fetch/$s_!H-6j!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60230654-74b5-41d9-baf0-e77e4a8bee1f_609x315.png 1272w, https://substackcdn.com/image/fetch/$s_!H-6j!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60230654-74b5-41d9-baf0-e77e4a8bee1f_609x315.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><ul><li><p>Only clicking search on the bottom right creates the next search iteration</p></li></ul><div 
class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!GrYH!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd3ff17e7-0628-45e4-b722-c7a7d5af48e9_448x760.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!GrYH!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd3ff17e7-0628-45e4-b722-c7a7d5af48e9_448x760.png 424w, https://substackcdn.com/image/fetch/$s_!GrYH!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd3ff17e7-0628-45e4-b722-c7a7d5af48e9_448x760.png 848w, https://substackcdn.com/image/fetch/$s_!GrYH!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd3ff17e7-0628-45e4-b722-c7a7d5af48e9_448x760.png 1272w, https://substackcdn.com/image/fetch/$s_!GrYH!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd3ff17e7-0628-45e4-b722-c7a7d5af48e9_448x760.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!GrYH!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd3ff17e7-0628-45e4-b722-c7a7d5af48e9_448x760.png" width="448" height="760" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/d3ff17e7-0628-45e4-b722-c7a7d5af48e9_448x760.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:760,&quot;width&quot;:448,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:94213,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd3ff17e7-0628-45e4-b722-c7a7d5af48e9_448x760.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!GrYH!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd3ff17e7-0628-45e4-b722-c7a7d5af48e9_448x760.png 424w, https://substackcdn.com/image/fetch/$s_!GrYH!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd3ff17e7-0628-45e4-b722-c7a7d5af48e9_448x760.png 848w, https://substackcdn.com/image/fetch/$s_!GrYH!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd3ff17e7-0628-45e4-b722-c7a7d5af48e9_448x760.png 1272w, https://substackcdn.com/image/fetch/$s_!GrYH!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd3ff17e7-0628-45e4-b722-c7a7d5af48e9_448x760.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>For example,</p><ul><li><p>I started off with 2 seed papers (1st iteration), and these 2 seed papers recommended papers based on &#8220;similarity&#8221; </p></li><li><p>I added 3 of them as input papers. I then switched mode to using &#8220;references&#8221; and ResearchRabbit will recommend other papers based on the 2 seed papers (not the 3 just added input papers)</p></li><li><p>I added 1 of them from the new mode as an input paper</p></li><li><p>Now I have 2+3+1 = 6 input papers which I can use to search as <em>the next iteration</em> using similarity/references/citations </p></li><li><p>ResearchRabbit now recommends a list of similar papers based on 6 input papers (2nd iteration) and I can add more input papers, switch to using references/citations of these 6 papers etc.</p><p></p></li></ul><h2>What actually creates a &#8220;rabbit 
hole&#8221; (iteration)</h2><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!zgjU!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3f78295f-c56c-4c51-9e9a-a274034f05e5_400x458.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!zgjU!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3f78295f-c56c-4c51-9e9a-a274034f05e5_400x458.png 424w, https://substackcdn.com/image/fetch/$s_!zgjU!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3f78295f-c56c-4c51-9e9a-a274034f05e5_400x458.png 848w, https://substackcdn.com/image/fetch/$s_!zgjU!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3f78295f-c56c-4c51-9e9a-a274034f05e5_400x458.png 1272w, https://substackcdn.com/image/fetch/$s_!zgjU!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3f78295f-c56c-4c51-9e9a-a274034f05e5_400x458.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!zgjU!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3f78295f-c56c-4c51-9e9a-a274034f05e5_400x458.png" width="400" height="458" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/3f78295f-c56c-4c51-9e9a-a274034f05e5_400x458.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:458,&quot;width&quot;:400,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:62446,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3f78295f-c56c-4c51-9e9a-a274034f05e5_400x458.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!zgjU!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3f78295f-c56c-4c51-9e9a-a274034f05e5_400x458.png 424w, https://substackcdn.com/image/fetch/$s_!zgjU!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3f78295f-c56c-4c51-9e9a-a274034f05e5_400x458.png 848w, https://substackcdn.com/image/fetch/$s_!zgjU!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3f78295f-c56c-4c51-9e9a-a274034f05e5_400x458.png 1272w, https://substackcdn.com/image/fetch/$s_!zgjU!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3f78295f-c56c-4c51-9e9a-a274034f05e5_400x458.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><ul><li><p><strong>Creates an iteration:</strong> clicking <strong>Search</strong> with the current <strong>input set</strong>.</p></li><li><p><strong>Does not create an iteration:</strong> switching <strong>Similar / References / Citations</strong>, changing axes or node sizes, or saving items to a <strong>collection</strong>.</p></li></ul><blockquote><p>Mental model: <strong>Mode = lens</strong> (changes what you <em>see with the <strong>last</strong> <strong>iteration input set</strong></em>). <strong>Iteration = checkpoint</strong> (records your step). <strong>Branch = fork</strong> (a new line of checkpoints starting from an earlier one).</p></blockquote><p>Additional notes: Running an author search, or clicking on the similar papers, citations, or references of an individual paper, automatically creates a new search iteration. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!2oJN!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b075b01-c025-4f27-9a12-210ced812a1a_553x491.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!2oJN!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b075b01-c025-4f27-9a12-210ced812a1a_553x491.png 424w, https://substackcdn.com/image/fetch/$s_!2oJN!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b075b01-c025-4f27-9a12-210ced812a1a_553x491.png 848w, https://substackcdn.com/image/fetch/$s_!2oJN!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b075b01-c025-4f27-9a12-210ced812a1a_553x491.png 1272w, https://substackcdn.com/image/fetch/$s_!2oJN!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b075b01-c025-4f27-9a12-210ced812a1a_553x491.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!2oJN!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b075b01-c025-4f27-9a12-210ced812a1a_553x491.png" width="553" height="491" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/0b075b01-c025-4f27-9a12-210ced812a1a_553x491.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:491,&quot;width&quot;:553,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:109497,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b075b01-c025-4f27-9a12-210ced812a1a_553x491.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!2oJN!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b075b01-c025-4f27-9a12-210ced812a1a_553x491.png 424w, https://substackcdn.com/image/fetch/$s_!2oJN!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b075b01-c025-4f27-9a12-210ced812a1a_553x491.png 848w, https://substackcdn.com/image/fetch/$s_!2oJN!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b075b01-c025-4f27-9a12-210ced812a1a_553x491.png 1272w, https://substackcdn.com/image/fetch/$s_!2oJN!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0b075b01-c025-4f27-9a12-210ced812a1a_553x491.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Still confused? 
Maybe this visual walkthrough will help.</p><h1>A Quick Walkthrough of the New ResearchRabbit</h1><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!GuC6!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff15cce78-c27c-441a-8dd4-f97647cb6715_1676x506.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!GuC6!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff15cce78-c27c-441a-8dd4-f97647cb6715_1676x506.png 424w, https://substackcdn.com/image/fetch/$s_!GuC6!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff15cce78-c27c-441a-8dd4-f97647cb6715_1676x506.png 848w, https://substackcdn.com/image/fetch/$s_!GuC6!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff15cce78-c27c-441a-8dd4-f97647cb6715_1676x506.png 1272w, https://substackcdn.com/image/fetch/$s_!GuC6!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff15cce78-c27c-441a-8dd4-f97647cb6715_1676x506.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!GuC6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff15cce78-c27c-441a-8dd4-f97647cb6715_1676x506.png" width="1456" height="440" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f15cce78-c27c-441a-8dd4-f97647cb6715_1676x506.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:440,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:305438,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff15cce78-c27c-441a-8dd4-f97647cb6715_1676x506.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!GuC6!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff15cce78-c27c-441a-8dd4-f97647cb6715_1676x506.png 424w, https://substackcdn.com/image/fetch/$s_!GuC6!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff15cce78-c27c-441a-8dd4-f97647cb6715_1676x506.png 848w, https://substackcdn.com/image/fetch/$s_!GuC6!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff15cce78-c27c-441a-8dd4-f97647cb6715_1676x506.png 1272w, https://substackcdn.com/image/fetch/$s_!GuC6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff15cce78-c27c-441a-8dd4-f97647cb6715_1676x506.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><p>Like any tool in this class, you begin by inputting &#8220;seed papers&#8221;&#8212;relevant articles that kickstart your search. With ResearchRabbit, you can search for papers, select from those already within the platform, or import them using formats like BibTeX, CSV, or RIS.</p><p>The older ResearchRabbit had a two-way sync with Zotero folders; as of this writing, that feature isn&#8217;t yet available in the new version.</p><p>From the first screenshot alone, you can already see Litmaps&#8217; influence, particularly in the ability to classify papers into different color-coded collections. 
<br></p><h2>Populating with the first seed papers</h2><p>For this walkthrough, I&#8217;ll search and select the first two papers as my seed papers and click search (bottom right).</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!rQ5W!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde9347d1-bcf3-4c87-83bf-b6f0116b6b03_1846x889.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!rQ5W!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde9347d1-bcf3-4c87-83bf-b6f0116b6b03_1846x889.png 424w, https://substackcdn.com/image/fetch/$s_!rQ5W!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde9347d1-bcf3-4c87-83bf-b6f0116b6b03_1846x889.png 848w, https://substackcdn.com/image/fetch/$s_!rQ5W!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde9347d1-bcf3-4c87-83bf-b6f0116b6b03_1846x889.png 1272w, https://substackcdn.com/image/fetch/$s_!rQ5W!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde9347d1-bcf3-4c87-83bf-b6f0116b6b03_1846x889.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!rQ5W!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde9347d1-bcf3-4c87-83bf-b6f0116b6b03_1846x889.png" width="1456" height="701" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/de9347d1-bcf3-4c87-83bf-b6f0116b6b03_1846x889.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:701,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:382763,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde9347d1-bcf3-4c87-83bf-b6f0116b6b03_1846x889.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!rQ5W!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde9347d1-bcf3-4c87-83bf-b6f0116b6b03_1846x889.png 424w, https://substackcdn.com/image/fetch/$s_!rQ5W!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde9347d1-bcf3-4c87-83bf-b6f0116b6b03_1846x889.png 848w, https://substackcdn.com/image/fetch/$s_!rQ5W!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde9347d1-bcf3-4c87-83bf-b6f0116b6b03_1846x889.png 1272w, https://substackcdn.com/image/fetch/$s_!rQ5W!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fde9347d1-bcf3-4c87-83bf-b6f0116b6b03_1846x889.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>From here, you&#8217;ll notice the interface is significantly different from the old ResearchRabbit, drawing considerable inspiration from Litmaps.</p><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!xaGr!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd96f30d8-5826-465a-b40c-aff2980ca85c_1866x885.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!xaGr!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd96f30d8-5826-465a-b40c-aff2980ca85c_1866x885.png 424w, 
https://substackcdn.com/image/fetch/$s_!xaGr!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd96f30d8-5826-465a-b40c-aff2980ca85c_1866x885.png 848w, https://substackcdn.com/image/fetch/$s_!xaGr!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd96f30d8-5826-465a-b40c-aff2980ca85c_1866x885.png 1272w, https://substackcdn.com/image/fetch/$s_!xaGr!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd96f30d8-5826-465a-b40c-aff2980ca85c_1866x885.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!xaGr!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd96f30d8-5826-465a-b40c-aff2980ca85c_1866x885.png" width="1456" height="691" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/d96f30d8-5826-465a-b40c-aff2980ca85c_1866x885.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:691,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:629862,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd96f30d8-5826-465a-b40c-aff2980ca85c_1866x885.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" 
srcset="https://substackcdn.com/image/fetch/$s_!xaGr!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd96f30d8-5826-465a-b40c-aff2980ca85c_1866x885.png 424w, https://substackcdn.com/image/fetch/$s_!xaGr!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd96f30d8-5826-465a-b40c-aff2980ca85c_1866x885.png 848w, https://substackcdn.com/image/fetch/$s_!xaGr!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd96f30d8-5826-465a-b40c-aff2980ca85c_1866x885.png 1272w, https://substackcdn.com/image/fetch/$s_!xaGr!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd96f30d8-5826-465a-b40c-aff2980ca85c_1866x885.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" 
stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>In the image above, ResearchRabbit displays recommended articles that are &#8220;similar&#8221; to our two seed articles. While I can&#8217;t be certain, &#8220;similar&#8221; likely refers to text similarity in the title/abstract (akin to <a href="https://medium.com/litmaps/guide-to-litmaps-visualisations-95a9bc2cc9de#:~:text=For%20those%20interested%20in%20the%20technical%20details%3A%20semantic%20embeddings%20are%20computed%20for%20each%20paper%E2%80%99s%20title%20using%20Allen%20AI%E2%80%99s%20SPECTER%20model%20(Cohan%2C%20et%20al.%202020).">Litmaps&#8217; text similarity function (Specter embeddings)</a>).</p><p>In the screenshot above, I have selected 2 papers in the recommended list to add as input papers.</p><p>You can, of course, switch to using citations or references to get a different set of recommended articles. But before we do that, let&#8217;s look at two major new interface changes.<br></p><h2>Customizable Visualization Graph</h2><p>Firstly, the visualization has been completely revamped. By default, papers are displayed as nodes, with the x-axis representing the publication year and the y-axis representing citation count. Arrows indicate the direction of citations. You can also clearly see which papers are already in your collection and which you&#8217;ve just selected as additional input.</p><p>By clicking the &#8220;About&#8221; button at the bottom right of the interface, you can customize what the x-axis, y-axis, and node size represent. 
</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!7OUc!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f99bde1-8d44-4460-bf29-a0dec389be83_1346x793.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!7OUc!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f99bde1-8d44-4460-bf29-a0dec389be83_1346x793.png 424w, https://substackcdn.com/image/fetch/$s_!7OUc!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f99bde1-8d44-4460-bf29-a0dec389be83_1346x793.png 848w, https://substackcdn.com/image/fetch/$s_!7OUc!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f99bde1-8d44-4460-bf29-a0dec389be83_1346x793.png 1272w, https://substackcdn.com/image/fetch/$s_!7OUc!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f99bde1-8d44-4460-bf29-a0dec389be83_1346x793.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!7OUc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f99bde1-8d44-4460-bf29-a0dec389be83_1346x793.png" width="1346" height="793" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/6f99bde1-8d44-4460-bf29-a0dec389be83_1346x793.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:793,&quot;width&quot;:1346,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!7OUc!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f99bde1-8d44-4460-bf29-a0dec389be83_1346x793.png 424w, https://substackcdn.com/image/fetch/$s_!7OUc!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f99bde1-8d44-4460-bf29-a0dec389be83_1346x793.png 848w, https://substackcdn.com/image/fetch/$s_!7OUc!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f99bde1-8d44-4460-bf29-a0dec389be83_1346x793.png 1272w, https://substackcdn.com/image/fetch/$s_!7OUc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6f99bde1-8d44-4460-bf29-a0dec389be83_1346x793.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" 
xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!TI-Y!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8486902-6970-4fcb-aed7-e2fc18f5c744_446x452.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!TI-Y!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8486902-6970-4fcb-aed7-e2fc18f5c744_446x452.png 424w, https://substackcdn.com/image/fetch/$s_!TI-Y!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8486902-6970-4fcb-aed7-e2fc18f5c744_446x452.png 848w, 
https://substackcdn.com/image/fetch/$s_!TI-Y!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8486902-6970-4fcb-aed7-e2fc18f5c744_446x452.png 1272w, https://substackcdn.com/image/fetch/$s_!TI-Y!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8486902-6970-4fcb-aed7-e2fc18f5c744_446x452.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!TI-Y!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8486902-6970-4fcb-aed7-e2fc18f5c744_446x452.png" width="446" height="452" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/e8486902-6970-4fcb-aed7-e2fc18f5c744_446x452.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:452,&quot;width&quot;:446,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:38285,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8486902-6970-4fcb-aed7-e2fc18f5c744_446x452.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!TI-Y!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8486902-6970-4fcb-aed7-e2fc18f5c744_446x452.png 424w, https://substackcdn.com/image/fetch/$s_!TI-Y!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8486902-6970-4fcb-aed7-e2fc18f5c744_446x452.png 848w, 
https://substackcdn.com/image/fetch/$s_!TI-Y!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8486902-6970-4fcb-aed7-e2fc18f5c744_446x452.png 1272w, https://substackcdn.com/image/fetch/$s_!TI-Y!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe8486902-6970-4fcb-aed7-e2fc18f5c744_446x452.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>The Y-axis can be customized to use citation count, reference count or publication date. 
With citation count, you can also use a log scale rather than just sticking to a linear scale (useful because citation counts vary greatly).</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!7zmV!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0426cb5e-9b48-4682-968c-ee09a51d40c5_425x470.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!7zmV!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0426cb5e-9b48-4682-968c-ee09a51d40c5_425x470.png 424w, https://substackcdn.com/image/fetch/$s_!7zmV!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0426cb5e-9b48-4682-968c-ee09a51d40c5_425x470.png 848w, https://substackcdn.com/image/fetch/$s_!7zmV!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0426cb5e-9b48-4682-968c-ee09a51d40c5_425x470.png 1272w, https://substackcdn.com/image/fetch/$s_!7zmV!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0426cb5e-9b48-4682-968c-ee09a51d40c5_425x470.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!7zmV!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0426cb5e-9b48-4682-968c-ee09a51d40c5_425x470.png" width="425" height="470" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/0426cb5e-9b48-4682-968c-ee09a51d40c5_425x470.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:470,&quot;width&quot;:425,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:33079,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0426cb5e-9b48-4682-968c-ee09a51d40c5_425x470.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!7zmV!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0426cb5e-9b48-4682-968c-ee09a51d40c5_425x470.png 424w, https://substackcdn.com/image/fetch/$s_!7zmV!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0426cb5e-9b48-4682-968c-ee09a51d40c5_425x470.png 848w, https://substackcdn.com/image/fetch/$s_!7zmV!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0426cb5e-9b48-4682-968c-ee09a51d40c5_425x470.png 1272w, https://substackcdn.com/image/fetch/$s_!7zmV!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0426cb5e-9b48-4682-968c-ee09a51d40c5_425x470.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>You see the same set of options for the node size.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!ivKP!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e37920e-972f-4fa4-a097-c8d9282e64a6_430x323.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!ivKP!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e37920e-972f-4fa4-a097-c8d9282e64a6_430x323.png 424w, 
https://substackcdn.com/image/fetch/$s_!ivKP!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e37920e-972f-4fa4-a097-c8d9282e64a6_430x323.png 848w, https://substackcdn.com/image/fetch/$s_!ivKP!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e37920e-972f-4fa4-a097-c8d9282e64a6_430x323.png 1272w, https://substackcdn.com/image/fetch/$s_!ivKP!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e37920e-972f-4fa4-a097-c8d9282e64a6_430x323.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!ivKP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e37920e-972f-4fa4-a097-c8d9282e64a6_430x323.png" width="430" height="323" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/5e37920e-972f-4fa4-a097-c8d9282e64a6_430x323.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:323,&quot;width&quot;:430,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:26388,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e37920e-972f-4fa4-a097-c8d9282e64a6_430x323.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!ivKP!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e37920e-972f-4fa4-a097-c8d9282e64a6_430x323.png 424w, 
https://substackcdn.com/image/fetch/$s_!ivKP!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e37920e-972f-4fa4-a097-c8d9282e64a6_430x323.png 848w, https://substackcdn.com/image/fetch/$s_!ivKP!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e37920e-972f-4fa4-a097-c8d9282e64a6_430x323.png 1272w, https://substackcdn.com/image/fetch/$s_!ivKP!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5e37920e-972f-4fa4-a097-c8d9282e64a6_430x323.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>If you&#8217;ve used Litmaps, these visualization options will be very familiar. That said, <a href="https://docs.litmaps.com/en/articles/9181490-use-and-edit-litmaps-visualization">Litmaps offers more options, such as visualizing by &#8220;momentum&#8221; and &#8220;map connectivity&#8221;, etc. </a></p><p>Personally, I find the default settings quite good, making it easy to spot seminal papers in the top left. However, you can change the settings&#8212;for instance, selecting &#8220;Ref Count&#8221; for node size or the Y-axis&#8212;to help identify review papers.</p><h2>Going Down the Rabbit Hole</h2><p>Another, perhaps even more significant, change is what I consider ResearchRabbit&#8217;s greatest improvement. The tool&#8217;s name likely alludes to the iterative citation searching process, which can lead to you &#8220;going down the rabbit hole.&#8221;</p><p>The original ResearchRabbit was designed to assist with this, but it listed every iterative stage as a separate column of papers (see below). This often felt overwhelming, and I admit it&#8217;s why, despite loving the concept, I rarely used it seriously. 
<br></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!_eN-!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F31de5c63-2bd0-4a69-a139-21f2177ca980_1050x675.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!_eN-!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F31de5c63-2bd0-4a69-a139-21f2177ca980_1050x675.png 424w, https://substackcdn.com/image/fetch/$s_!_eN-!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F31de5c63-2bd0-4a69-a139-21f2177ca980_1050x675.png 848w, https://substackcdn.com/image/fetch/$s_!_eN-!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F31de5c63-2bd0-4a69-a139-21f2177ca980_1050x675.png 1272w, https://substackcdn.com/image/fetch/$s_!_eN-!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F31de5c63-2bd0-4a69-a139-21f2177ca980_1050x675.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!_eN-!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F31de5c63-2bd0-4a69-a139-21f2177ca980_1050x675.png" width="1050" height="675" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/31de5c63-2bd0-4a69-a139-21f2177ca980_1050x675.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:675,&quot;width&quot;:1050,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!_eN-!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F31de5c63-2bd0-4a69-a139-21f2177ca980_1050x675.png 424w, https://substackcdn.com/image/fetch/$s_!_eN-!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F31de5c63-2bd0-4a69-a139-21f2177ca980_1050x675.png 848w, https://substackcdn.com/image/fetch/$s_!_eN-!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F31de5c63-2bd0-4a69-a139-21f2177ca980_1050x675.png 1272w, https://substackcdn.com/image/fetch/$s_!_eN-!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F31de5c63-2bd0-4a69-a139-21f2177ca980_1050x675.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path 
d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>This is, of course, very overwhelming, and I admit this is why, while I love the idea of ResearchRabbit, I rarely used it seriously.</p><p>With the new ResearchRabbit, much of this complexity is hidden, and the interface primarily shows the visualization of the <em>last</em> step. In the example below, I&#8217;ve performed the search four times, but I&#8217;ve &#8220;moved the rabbit backward&#8221; to the third iteration! 
You can see the rabbit icon is in the 3rd of 4 &#8220;rabbit holes.&#8221; </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Roul!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F59efaaa4-1029-4a96-83fc-267bffe2426f_977x678.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Roul!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F59efaaa4-1029-4a96-83fc-267bffe2426f_977x678.png 424w, https://substackcdn.com/image/fetch/$s_!Roul!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F59efaaa4-1029-4a96-83fc-267bffe2426f_977x678.png 848w, https://substackcdn.com/image/fetch/$s_!Roul!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F59efaaa4-1029-4a96-83fc-267bffe2426f_977x678.png 1272w, https://substackcdn.com/image/fetch/$s_!Roul!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F59efaaa4-1029-4a96-83fc-267bffe2426f_977x678.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Roul!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F59efaaa4-1029-4a96-83fc-267bffe2426f_977x678.png" width="977" height="678" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/59efaaa4-1029-4a96-83fc-267bffe2426f_977x678.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:678,&quot;width&quot;:977,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:253914,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F59efaaa4-1029-4a96-83fc-267bffe2426f_977x678.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Roul!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F59efaaa4-1029-4a96-83fc-267bffe2426f_977x678.png 424w, https://substackcdn.com/image/fetch/$s_!Roul!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F59efaaa4-1029-4a96-83fc-267bffe2426f_977x678.png 848w, https://substackcdn.com/image/fetch/$s_!Roul!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F59efaaa4-1029-4a96-83fc-267bffe2426f_977x678.png 1272w, https://substackcdn.com/image/fetch/$s_!Roul!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F59efaaa4-1029-4a96-83fc-267bffe2426f_977x678.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2>Adding More Papers to Search and Collection</h2><p>Let&#8217;s return to an earlier stage by moving back to the second iteration (where the rabbit icon is in the 2nd &#8220;rabbit hole&#8221;) by clicking on the icon.</p><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!wDZR!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd2a54811-459e-4fd8-92dc-f24c07389151_285x125.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!wDZR!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd2a54811-459e-4fd8-92dc-f24c07389151_285x125.png 424w, 
https://substackcdn.com/image/fetch/$s_!wDZR!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd2a54811-459e-4fd8-92dc-f24c07389151_285x125.png 848w, https://substackcdn.com/image/fetch/$s_!wDZR!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd2a54811-459e-4fd8-92dc-f24c07389151_285x125.png 1272w, https://substackcdn.com/image/fetch/$s_!wDZR!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd2a54811-459e-4fd8-92dc-f24c07389151_285x125.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!wDZR!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd2a54811-459e-4fd8-92dc-f24c07389151_285x125.png" width="285" height="125" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/d2a54811-459e-4fd8-92dc-f24c07389151_285x125.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:125,&quot;width&quot;:285,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:22366,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd2a54811-459e-4fd8-92dc-f24c07389151_285x125.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!wDZR!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd2a54811-459e-4fd8-92dc-f24c07389151_285x125.png 424w, 
https://substackcdn.com/image/fetch/$s_!wDZR!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd2a54811-459e-4fd8-92dc-f24c07389151_285x125.png 848w, https://substackcdn.com/image/fetch/$s_!wDZR!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd2a54811-459e-4fd8-92dc-f24c07389151_285x125.png 1272w, https://substackcdn.com/image/fetch/$s_!wDZR!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fd2a54811-459e-4fd8-92dc-f24c07389151_285x125.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p></p><p>To recap, I started my search with two seed papers. ResearchRabbit then suggested papers &#8220;similar&#8221; to these seed papers, and now I selected three of them as inputs. <br></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!LPCb!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc68d0df-15f4-4042-901b-73dca6d5a473_1852x898.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!LPCb!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc68d0df-15f4-4042-901b-73dca6d5a473_1852x898.png 424w, https://substackcdn.com/image/fetch/$s_!LPCb!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc68d0df-15f4-4042-901b-73dca6d5a473_1852x898.png 848w, 
https://substackcdn.com/image/fetch/$s_!LPCb!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc68d0df-15f4-4042-901b-73dca6d5a473_1852x898.png 1272w, https://substackcdn.com/image/fetch/$s_!LPCb!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc68d0df-15f4-4042-901b-73dca6d5a473_1852x898.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!LPCb!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc68d0df-15f4-4042-901b-73dca6d5a473_1852x898.png" width="1456" height="706" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/bc68d0df-15f4-4042-901b-73dca6d5a473_1852x898.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:706,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:604660,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc68d0df-15f4-4042-901b-73dca6d5a473_1852x898.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!LPCb!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc68d0df-15f4-4042-901b-73dca6d5a473_1852x898.png 424w, 
https://substackcdn.com/image/fetch/$s_!LPCb!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc68d0df-15f4-4042-901b-73dca6d5a473_1852x898.png 848w, https://substackcdn.com/image/fetch/$s_!LPCb!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc68d0df-15f4-4042-901b-73dca6d5a473_1852x898.png 1272w, https://substackcdn.com/image/fetch/$s_!LPCb!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fbc68d0df-15f4-4042-901b-73dca6d5a473_1852x898.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line 
x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>At this stage, these three selected papers are *not* immediately added to my collection. I have two choices:</p><p>1. I can add these three selected papers directly to an existing collection and/or create a new, color-coded collection by clicking on &#8220;save to...&#8221;. </p><p>2. Alternatively, I can choose not to save them at this point.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!OamV!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7c3dd743-c03b-464a-bab1-d9496fe99df7_467x323.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!OamV!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7c3dd743-c03b-464a-bab1-d9496fe99df7_467x323.png 424w, https://substackcdn.com/image/fetch/$s_!OamV!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7c3dd743-c03b-464a-bab1-d9496fe99df7_467x323.png 848w, https://substackcdn.com/image/fetch/$s_!OamV!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7c3dd743-c03b-464a-bab1-d9496fe99df7_467x323.png 1272w, https://substackcdn.com/image/fetch/$s_!OamV!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7c3dd743-c03b-464a-bab1-d9496fe99df7_467x323.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!OamV!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7c3dd743-c03b-464a-bab1-d9496fe99df7_467x323.png" width="467" height="323" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/7c3dd743-c03b-464a-bab1-d9496fe99df7_467x323.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:323,&quot;width&quot;:467,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:62486,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7c3dd743-c03b-464a-bab1-d9496fe99df7_467x323.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!OamV!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7c3dd743-c03b-464a-bab1-d9496fe99df7_467x323.png 424w, https://substackcdn.com/image/fetch/$s_!OamV!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7c3dd743-c03b-464a-bab1-d9496fe99df7_467x323.png 848w, https://substackcdn.com/image/fetch/$s_!OamV!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7c3dd743-c03b-464a-bab1-d9496fe99df7_467x323.png 1272w, https://substackcdn.com/image/fetch/$s_!OamV!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F7c3dd743-c03b-464a-bab1-d9496fe99df7_467x323.png 1456w" sizes="100vw" 
loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Regardless of whether you save the papers to your collection, it&#8217;s important to note that once you&#8217;ve selected these three new input papers, the bottom right of the interface will show you the option to perform another iterative search. This new search will use five selected papers (the 2 original seed articles + the 3 new input papers). Clicking &#8220;search&#8221; here will create another search iteration, causing a new &#8220;rabbit hole&#8221; to appear on the top left. 
<br></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!F-Hm!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3c9ac871-640e-4f36-abcb-cf47890d02ee_1880x899.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!F-Hm!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3c9ac871-640e-4f36-abcb-cf47890d02ee_1880x899.png 424w, https://substackcdn.com/image/fetch/$s_!F-Hm!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3c9ac871-640e-4f36-abcb-cf47890d02ee_1880x899.png 848w, https://substackcdn.com/image/fetch/$s_!F-Hm!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3c9ac871-640e-4f36-abcb-cf47890d02ee_1880x899.png 1272w, https://substackcdn.com/image/fetch/$s_!F-Hm!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3c9ac871-640e-4f36-abcb-cf47890d02ee_1880x899.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!F-Hm!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3c9ac871-640e-4f36-abcb-cf47890d02ee_1880x899.png" width="1456" height="696" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/3c9ac871-640e-4f36-abcb-cf47890d02ee_1880x899.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:696,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:611556,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3c9ac871-640e-4f36-abcb-cf47890d02ee_1880x899.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!F-Hm!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3c9ac871-640e-4f36-abcb-cf47890d02ee_1880x899.png 424w, https://substackcdn.com/image/fetch/$s_!F-Hm!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3c9ac871-640e-4f36-abcb-cf47890d02ee_1880x899.png 848w, https://substackcdn.com/image/fetch/$s_!F-Hm!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3c9ac871-640e-4f36-abcb-cf47890d02ee_1880x899.png 1272w, https://substackcdn.com/image/fetch/$s_!F-Hm!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F3c9ac871-640e-4f36-abcb-cf47890d02ee_1880x899.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>However, before proceeding with that search, you might want to adjust the settings to look at either the citations or references of your *initial* two seed papers by changing the setting on the top left. 
</p><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!85Q2!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F017774e8-c818-417d-b064-7d63aea1f797_1485x816.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!85Q2!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F017774e8-c818-417d-b064-7d63aea1f797_1485x816.png 424w, https://substackcdn.com/image/fetch/$s_!85Q2!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F017774e8-c818-417d-b064-7d63aea1f797_1485x816.png 848w, https://substackcdn.com/image/fetch/$s_!85Q2!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F017774e8-c818-417d-b064-7d63aea1f797_1485x816.png 1272w, https://substackcdn.com/image/fetch/$s_!85Q2!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F017774e8-c818-417d-b064-7d63aea1f797_1485x816.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!85Q2!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F017774e8-c818-417d-b064-7d63aea1f797_1485x816.png" width="1456" height="800" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/017774e8-c818-417d-b064-7d63aea1f797_1485x816.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:800,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:213820,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F017774e8-c818-417d-b064-7d63aea1f797_1485x816.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!85Q2!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F017774e8-c818-417d-b064-7d63aea1f797_1485x816.png 424w, https://substackcdn.com/image/fetch/$s_!85Q2!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F017774e8-c818-417d-b064-7d63aea1f797_1485x816.png 848w, https://substackcdn.com/image/fetch/$s_!85Q2!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F017774e8-c818-417d-b064-7d63aea1f797_1485x816.png 1272w, https://substackcdn.com/image/fetch/$s_!85Q2!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F017774e8-c818-417d-b064-7d63aea1f797_1485x816.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Besides finding recommended papers by similarity/citations/references, ResearchRabbit also offers other settings to refine recommended articles, such as limiting by:</p><p>a) Specific keywords</p><p>b) Publication date</p><p>c) SJR Quartiles</p><p>d) H-index of the journal</p><p>e) H-index of the journal</p><p>f) Excluding retractions</p><p>However, these advanced settings are exclusively available for paid accounts.</p><p>Let&#8217;s assume you choose to look for recommendations based on references of the two original seed papers and click &#8220;save.&#8221; </p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" 
href="https://substackcdn.com/image/fetch/$s_!o55M!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe0a5341c-c168-49d0-8718-2fe6157837ae_1876x915.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!o55M!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe0a5341c-c168-49d0-8718-2fe6157837ae_1876x915.png 424w, https://substackcdn.com/image/fetch/$s_!o55M!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe0a5341c-c168-49d0-8718-2fe6157837ae_1876x915.png 848w, https://substackcdn.com/image/fetch/$s_!o55M!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe0a5341c-c168-49d0-8718-2fe6157837ae_1876x915.png 1272w, https://substackcdn.com/image/fetch/$s_!o55M!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe0a5341c-c168-49d0-8718-2fe6157837ae_1876x915.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!o55M!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe0a5341c-c168-49d0-8718-2fe6157837ae_1876x915.png" width="1456" height="710" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/e0a5341c-c168-49d0-8718-2fe6157837ae_1876x915.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:710,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:484655,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe0a5341c-c168-49d0-8718-2fe6157837ae_1876x915.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!o55M!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe0a5341c-c168-49d0-8718-2fe6157837ae_1876x915.png 424w, https://substackcdn.com/image/fetch/$s_!o55M!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe0a5341c-c168-49d0-8718-2fe6157837ae_1876x915.png 848w, https://substackcdn.com/image/fetch/$s_!o55M!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe0a5341c-c168-49d0-8718-2fe6157837ae_1876x915.png 1272w, https://substackcdn.com/image/fetch/$s_!o55M!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fe0a5341c-c168-49d0-8718-2fe6157837ae_1876x915.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>In the image above, ResearchRabbit is displaying recommendations based on the references of the 2 original seed papers, and I have selected one of them. This results in 4 selected papers on the right (3 found via &#8220;similar&#8221; and 1 found via &#8220;references&#8221; of the 2 seed papers). This is why the search setting now shows a total of 6 articles (the 2 seed papers + 4 input papers).</p><blockquote><p>For those who are technically minded or just worried about reproducibility, you might wonder whether ResearchRabbit is literally just showing direct references from the seed papers (including input papers), or whether it is doing something more complicated like bibliographic coupling, co-citations or some other blend of bibliometric/network analysis methods. 
I have no clue, though at a casual glance it seems to me that it is just direct references.</p></blockquote><p>It is important to note that changing the settings&#8212;from &#8220;similar&#8221; to &#8220;references&#8221; to &#8220;citations&#8221;&#8212;is not considered a search iteration and does not create a new &#8220;research rabbit hole&#8221; at the top of the interface.</p><p>Note: Besides searching for citations and references, you can also use authors to search for papers, but I rarely find it useful.</p><blockquote><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!VcrU!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F948d556a-a444-48c0-be5a-a8ccf2e1339a_531x549.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!VcrU!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F948d556a-a444-48c0-be5a-a8ccf2e1339a_531x549.png 424w, https://substackcdn.com/image/fetch/$s_!VcrU!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F948d556a-a444-48c0-be5a-a8ccf2e1339a_531x549.png 848w, https://substackcdn.com/image/fetch/$s_!VcrU!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F948d556a-a444-48c0-be5a-a8ccf2e1339a_531x549.png 1272w, https://substackcdn.com/image/fetch/$s_!VcrU!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F948d556a-a444-48c0-be5a-a8ccf2e1339a_531x549.png 1456w" sizes="100vw"><img 
src="https://substackcdn.com/image/fetch/$s_!VcrU!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F948d556a-a444-48c0-be5a-a8ccf2e1339a_531x549.png" width="531" height="549" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/948d556a-a444-48c0-be5a-a8ccf2e1339a_531x549.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:549,&quot;width&quot;:531,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:41990,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F948d556a-a444-48c0-be5a-a8ccf2e1339a_531x549.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!VcrU!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F948d556a-a444-48c0-be5a-a8ccf2e1339a_531x549.png 424w, https://substackcdn.com/image/fetch/$s_!VcrU!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F948d556a-a444-48c0-be5a-a8ccf2e1339a_531x549.png 848w, https://substackcdn.com/image/fetch/$s_!VcrU!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F948d556a-a444-48c0-be5a-a8ccf2e1339a_531x549.png 1272w, https://substackcdn.com/image/fetch/$s_!VcrU!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F948d556a-a444-48c0-be5a-a8ccf2e1339a_531x549.png 1456w" sizes="100vw" 
loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p></blockquote><p>Typically, to be more thorough, I would change the setting to &#8220;citations&#8221; of the 2 seed papers to find more input papers. But let&#8217;s say I do that and find no more relevant ones. 
Now I am ready to click the search button on the bottom right, which will initiate a new &#8220;Search iteration&#8221; using all 6 input papers.</p><blockquote><p>Note: Currently, I have 3 additional papers in my collection (in addition to the 2 seed papers), but the latest input paper is not in any collection because I did not perform the &#8220;save to...&#8221; step.</p></blockquote><p>Next, I used the 6 input papers (original 2 seed papers + 3 input papers from similarity + 1 input paper from references) to run another search iteration (this time using &#8220;references&#8221;). Here, I added 2 more input papers, which means the next search will be based on 8 papers, and the cycle continues.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!jzvs!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feac2ae37-21b4-4739-8487-08ea2bb3d174_1845x914.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!jzvs!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feac2ae37-21b4-4739-8487-08ea2bb3d174_1845x914.png 424w, https://substackcdn.com/image/fetch/$s_!jzvs!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feac2ae37-21b4-4739-8487-08ea2bb3d174_1845x914.png 848w, https://substackcdn.com/image/fetch/$s_!jzvs!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feac2ae37-21b4-4739-8487-08ea2bb3d174_1845x914.png 1272w, 
https://substackcdn.com/image/fetch/$s_!jzvs!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feac2ae37-21b4-4739-8487-08ea2bb3d174_1845x914.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!jzvs!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feac2ae37-21b4-4739-8487-08ea2bb3d174_1845x914.png" width="1456" height="721" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/eac2ae37-21b4-4739-8487-08ea2bb3d174_1845x914.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:721,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:592847,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feac2ae37-21b4-4739-8487-08ea2bb3d174_1845x914.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!jzvs!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feac2ae37-21b4-4739-8487-08ea2bb3d174_1845x914.png 424w, https://substackcdn.com/image/fetch/$s_!jzvs!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feac2ae37-21b4-4739-8487-08ea2bb3d174_1845x914.png 848w, 
https://substackcdn.com/image/fetch/$s_!jzvs!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feac2ae37-21b4-4739-8487-08ea2bb3d174_1845x914.png 1272w, https://substackcdn.com/image/fetch/$s_!jzvs!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feac2ae37-21b4-4739-8487-08ea2bb3d174_1845x914.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p></p><blockquote><p>The &#8220;rabbit hole&#8221; icons now show that I am in the last step of the 3rd iteration. 
Previously, I was in the 2nd iteration of 4 (the rabbit icon was in the 2nd rabbit hole out of 4). It seems that in ResearchRabbit, if you move to an older iteration and search from there, it starts a new branch from that point and wipes out the other &#8220;future iterations&#8221;.</p></blockquote><h2>Another way to save papers</h2><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!HIpO!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77a7e538-24eb-4871-9018-3ee5cb32abe6_237x128.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!HIpO!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77a7e538-24eb-4871-9018-3ee5cb32abe6_237x128.png 424w, https://substackcdn.com/image/fetch/$s_!HIpO!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77a7e538-24eb-4871-9018-3ee5cb32abe6_237x128.png 848w, https://substackcdn.com/image/fetch/$s_!HIpO!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77a7e538-24eb-4871-9018-3ee5cb32abe6_237x128.png 1272w, https://substackcdn.com/image/fetch/$s_!HIpO!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77a7e538-24eb-4871-9018-3ee5cb32abe6_237x128.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!HIpO!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77a7e538-24eb-4871-9018-3ee5cb32abe6_237x128.png" width="237" height="128" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/77a7e538-24eb-4871-9018-3ee5cb32abe6_237x128.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:128,&quot;width&quot;:237,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:9019,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77a7e538-24eb-4871-9018-3ee5cb32abe6_237x128.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!HIpO!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77a7e538-24eb-4871-9018-3ee5cb32abe6_237x128.png 424w, https://substackcdn.com/image/fetch/$s_!HIpO!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77a7e538-24eb-4871-9018-3ee5cb32abe6_237x128.png 848w, https://substackcdn.com/image/fetch/$s_!HIpO!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77a7e538-24eb-4871-9018-3ee5cb32abe6_237x128.png 1272w, https://substackcdn.com/image/fetch/$s_!HIpO!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F77a7e538-24eb-4871-9018-3ee5cb32abe6_237x128.png 1456w" sizes="100vw" loading="lazy"></picture><div></div></div></a></figure></div><p>While you can add input papers to your collections along the way, another alternative is to perform all your iterative searches first (selecting input papers at each step). 
When you want to end the process, click the &#8220;X&#8221; icon next to the trail of rabbit holes. </p><p>On the next screen, you will be prompted to add these papers to your collection.</p><p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!KIPB!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1266b268-3f75-4d24-8395-f063c1d65528_1407x853.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!KIPB!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1266b268-3f75-4d24-8395-f063c1d65528_1407x853.png 424w, https://substackcdn.com/image/fetch/$s_!KIPB!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1266b268-3f75-4d24-8395-f063c1d65528_1407x853.png 848w, https://substackcdn.com/image/fetch/$s_!KIPB!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1266b268-3f75-4d24-8395-f063c1d65528_1407x853.png 1272w, https://substackcdn.com/image/fetch/$s_!KIPB!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1266b268-3f75-4d24-8395-f063c1d65528_1407x853.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!KIPB!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1266b268-3f75-4d24-8395-f063c1d65528_1407x853.png" width="1407" height="853" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/1266b268-3f75-4d24-8395-f063c1d65528_1407x853.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:853,&quot;width&quot;:1407,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:266951,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1266b268-3f75-4d24-8395-f063c1d65528_1407x853.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!KIPB!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1266b268-3f75-4d24-8395-f063c1d65528_1407x853.png 424w, https://substackcdn.com/image/fetch/$s_!KIPB!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1266b268-3f75-4d24-8395-f063c1d65528_1407x853.png 848w, https://substackcdn.com/image/fetch/$s_!KIPB!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1266b268-3f75-4d24-8395-f063c1d65528_1407x853.png 1272w, https://substackcdn.com/image/fetch/$s_!KIPB!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1266b268-3f75-4d24-8395-f063c1d65528_1407x853.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" 
height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><h2>Paid versus Free Account</h2><p>As mentioned, this new version of ResearchRabbit now offers a premium version. 
What do you get with that?</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!aFyc!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff9349b79-5fed-432a-a70e-bd8f5dcb29da_966x661.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!aFyc!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff9349b79-5fed-432a-a70e-bd8f5dcb29da_966x661.png 424w, https://substackcdn.com/image/fetch/$s_!aFyc!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff9349b79-5fed-432a-a70e-bd8f5dcb29da_966x661.png 848w, https://substackcdn.com/image/fetch/$s_!aFyc!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff9349b79-5fed-432a-a70e-bd8f5dcb29da_966x661.png 1272w, https://substackcdn.com/image/fetch/$s_!aFyc!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff9349b79-5fed-432a-a70e-bd8f5dcb29da_966x661.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!aFyc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff9349b79-5fed-432a-a70e-bd8f5dcb29da_966x661.png" width="966" height="661" 
data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f9349b79-5fed-432a-a70e-bd8f5dcb29da_966x661.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:661,&quot;width&quot;:966,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:69364,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://aarontay.substack.com/i/177676779?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff9349b79-5fed-432a-a70e-bd8f5dcb29da_966x661.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!aFyc!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff9349b79-5fed-432a-a70e-bd8f5dcb29da_966x661.png 424w, https://substackcdn.com/image/fetch/$s_!aFyc!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff9349b79-5fed-432a-a70e-bd8f5dcb29da_966x661.png 848w, https://substackcdn.com/image/fetch/$s_!aFyc!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff9349b79-5fed-432a-a70e-bd8f5dcb29da_966x661.png 1272w, https://substackcdn.com/image/fetch/$s_!aFyc!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff9349b79-5fed-432a-a70e-bd8f5dcb29da_966x661.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" 
viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Firstly, you can search with a maximum of 300 input papers (as opposed to 50 for free).</p><p>Secondly, you gain access to the advanced settings mentioned earlier. I think this is the feature people want the most; for example, some users will want to look only at papers in top journals. I understand the need for ResearchRabbit to earn revenue, still, it would have been nice if ResearchRabbit gave free users the ability to filter out retractions, as this seems like a critical feature to improve research.</p><p>Thirdly, while the free account allows for unlimited collections, you can only create one &#8220;research project&#8221; per account. 
This probably isn&#8217;t as critical because, assuming your collections are distinct, they essentially function as projects.</p><h2>Conclusion</h2><p>Overall, the newer ResearchRabbit seems to be an improvement over the original, with a less crowded and messy interface. Also, you can see the obvious, heavy influence of the partnership with Litmaps. However, in my opinion, ResearchRabbit&#8217;s interface is easier to understand, though it may have less functionality.</p><p>That said, the &#8220;rabbit hole&#8221; interface and its metaphor are not as intuitive as they could be, and it took me a while to figure out what triggered a &#8220;rabbit hole&#8221; creation versus what did not. But I guess for most people, understanding this distinction isn&#8217;t important, as they just want to iterate quickly among the options without documenting every step.</p><p>It&#8217;s a pity the advanced search filters are hidden behind a paywall, but that&#8217;s the point of a premium service, I suppose&#8212;to offer desirable features.</p><p>All in all, the 2025 redesign makes <strong>iterative chaining</strong> in ResearchRabbit genuinely usable, with fewer UI distractions. For most exploratory tasks, the <strong>free tier</strong> is enough; if you need journal-level filters, <strong>Litmaps Pro</strong> may provide more value. For a fast single-seed overview, <strong>Connected Papers</strong> remains the quickest on-ramp. 
</p><p>Of course, for the most transparent tool for systematic review use, the free <a href="https://www.eshackathon.org/software/citationchaser.html">citationchaser</a> is by far the most popular.</p>]]></content:encoded></item><item><title><![CDATA[“We’re Good at Search”… Just Not the Kind That the AI era Demands - a Provocation]]></title><description><![CDATA[I might be exaggerating slightly, but if you look at the few new evaluation matrices for AI-powered search circulating, &#8220;relevancy&#8221; is often just one of several categories, evaluated in a highly subjective and &#8220;I-know-it-when-I-see-it&#8221; manner.&#160;This is baffling, given that a search engine (AI-powered or not) lives and dies on its ability to retrieve relevant results. Even generative tools that author reports are building on a house of cards if their underlying retrieval system fails to find the most relevant items.]]></description><link>https://aarontay.substack.com/p/were-good-at-search-just-not-the</link><guid isPermaLink="false">https://aarontay.substack.com/p/were-good-at-search-just-not-the</guid><dc:creator><![CDATA[Aaron Tay]]></dc:creator><pubDate>Thu, 23 Oct 2025 16:16:06 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!SIBS!,w_256,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdabe20d0-c305-4694-b04d-13176319efee_440x440.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<p>Recently, a librarian from a prestigious institution I met at a conference surprised me when he confessed that he and his colleagues were struggling to grasp the issues surrounding the impact of AI. But my talk helped clear up much of the fog around how to think about the impact of AI on search.</p><p>His confession wasn&#8217;t an isolated one. Many librarians I speak with admit they struggle to keep up with the blizzard of new AI-powered search engines. 
More importantly, I sense that many of us lack the right mental models to properly discuss, analyze, and evaluate them.</p><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://ko-fi.com/aarontay&quot;,&quot;text&quot;:&quot;Buy me Coffee! (via ko-fi)&quot;,&quot;action&quot;:null,&quot;class&quot;:null}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://ko-fi.com/aarontay"><span>Buy me Coffee! (via ko-fi)</span></a></p><h2>The Pressure We Feel</h2><p>Here&#8217;s the uncomfortable truth: we librarians have long held a self-image as masters of search&#8212;or at least, competent practitioners. This identity creates immense pressure to stay on top of &#8220;AI search&#8221; and project understanding. Yet many of us quietly feel inadequate, struggling to reconcile our traditional expertise with these emerging tools.</p><p>The reality is that we are good at searching&#8212;just in ways that differ from what may be needed now.</p><h2>What We&#8217;ve Always Been Good At</h2><p>Our traditional strengths in search are considerable. The best reference librarians among us possess remarkable resourcefulness, drawing from numerous sources and techniques to unearth answers that would elude even the most persistent Google user. In our domains of expertise, we can locate information&#8212;both online and offline&#8212;that others simply cannot find.</p><p>Many of us have mastered database searching within a specific paradigm: Boolean retrieval, ranking by TF-IDF or BM25. We are experts at the use of proximity operators and filters, while the finest medical librarians know MeSH like the back of their hand. 
Others have equivalent expertise in LCSH or specialized thesauri.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://aarontay.substack.com/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Thanks for reading Aaron Tay's Musings about Librarianship! Subscribe for free to receive new posts and support my work.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p>Evidence synthesis librarians come closest to theoretical information retrieval expertise, with their knowledge of piloting searches, validating hedges, and understanding retrieval metrics like sensitivity, precision, specificity, and negative predictive value. Some even research stopping points for active learning tools like ASReview. 
</p><p>[Added Nov 2025] I would say the knowledge needed to conduct the relatively new <a href="https://onlinelibrary.wiley.com/doi/10.1111/jebm.12505">Study Within a Review (SWAR)</a> is approximately the type of skillset that we need, and one that is rare among librarians.</p><blockquote><p>Another area that is search related is how we teach users to use SIFT (which involves searching to do lateral reading); this is likely to shift also now that we have extremely powerful search tools like <a href="https://search.google/ways-to-search/ai-mode/">Google&#8217;s AI mode</a> to <a href="https://aarontay.substack.com/p/googles-ai-mode-it-can-out-search">do the heavy lifting of searching to help the human with validation</a>&#8212;see <a href="https://mikecaulfield.substack.com/p/my-youtube-ai-mode-infolit-hoedown">the work of Mike Caulfield of SIFT fame on how to do this in an emerging and exciting new area.</a></p></blockquote><p>The problem? These hard-won skills offer little preparation for the world we live in now.</p><p>We now inhabit a world defined by unfamiliar terminology: natural language search, semantic search, dense embeddings, vector embeddings, retrieval augmented generation, deep research, agentic search. These aren&#8217;t just buzzwords&#8212;they <em>represent <a href="https://www.youtube.com/watch?v=Ju-JS_sp73U">fundamentally different families of approaches to information retrieval with different trade-offs and implications as we move beyond just Boolean search</a>.</em></p><blockquote><p>I&#8217;m skating over a crucial question here: are these AI advancements genuine improvements over traditional search methods, or are we caught up early in a hype cycle with little real benefit? For example, does semantic search really retrieve more relevant results for scholarly research, or does it just feel more modern? 
Even if these methods do objectively get you higher recall and precision, is it worth the costs you pay in <a href="https://aarontay.substack.com/p/the-reproducibility-and">reduced interpretability and reproducibility</a>, <a href="https://aarontay.substack.com/p/the-ai-powered-library-search-that">unknown possibility of bias</a>, and <a href="https://aarontay.substack.com/p/the-case-of-the-vanishing-hit-count">the lack of exact search hits</a>? Also, there are legitimate reasons why medical librarians still depend on Boolean search with MeSH&#8212;precision, control, and reproducibility matter, especially for systematic reviews and evidence synthesis.</p><p>I&#8217;ll address this tension directly in my next post. But for now, let me argue that regardless of where you stand on the &#8220;improvement vs. hype&#8221; question, librarians need to understand these technologies well enough to critically evaluate them.</p></blockquote><h2>Our Evaluation Blind Spot - a Provocation</h2><p>This brings us to an odd thing I have noticed.</p><p>When librarians assess a new search engine or database (AI-powered or not), I notice we often focus on familiar factors: the UI, the availability of filters, the sources covered, privacy terms, vendor support, and even niche library requirements like COUNTER support or link resolver integration.</p><p>Strangely, the effectiveness of the core relevancy system is, if not an afterthought, rarely the central focus.</p><p>I might be exaggerating slightly, but if you look at the few new evaluation matrices for AI-powered search circulating, &#8220;relevancy&#8221; is often just one of several categories, evaluated in a highly subjective and &#8220;I-know-it-when-I-see-it&#8221; manner. </p><p><em>This is baffling, given that a search engine (AI-powered or not) lives and dies on its ability to retrieve relevant results</em>. 
Even generative tools that author reports are building on a house of cards if their underlying retrieval system fails to find the most relevant items.</p><blockquote><p>I am not saying features like link resolver support aren&#8217;t important. But notice the asymmetry here: it is far easier for a product with proven good relevancy models to build link resolver support than the reverse. I&#8217;ve also noticed that most feature &#8220;innovations&#8221; like specific visualizations in Deep Research tools are easily and quickly copied. Unfortunately, relevancy models are much harder to copy. All this makes it even more important to double down on choosing products by how good they are at retrieval.</p></blockquote><p></p><p>Why this blind spot? Let me advance a hypothesis. </p><p>Because for the last 15 or 20 years, academic databases have all <em>functioned in fundamentally the same way. </em> </p><ul><li><p>Index content in an inverted index</p></li><li><p>Retrieve with Boolean</p></li><li><p>Rank with some variant of TF-IDF or BM25</p></li></ul><p>This is admittedly oversimplified (we glide past BM25F, proximity, citation/authority, and learning-to-rank in some academic systems), and things like Google and Google Scholar break the mold (which is also why we initially struggled with them), but in such a world, the main differentiator wasn&#8217;t usually the retrieval algorithm&#8212;which was a commodity. The main things that mattered were coverage (which journals do you have?) and, secondarily, the user-friendliness of the interface.  </p><h2>The Wild West of AI-Powered Search</h2><p>Today&#8217;s landscape couldn&#8217;t be more different. </p><p>Many of the new AI search engines (like Elicit, Consensus, Undermind, etc.) are drawing from the same pool of open content (like Semantic Scholar or OpenAlex). 
They are competing almost <em>entirely</em> on the difference in their retrieval and ranking capabilities.</p><p>Unlike a decade or two ago, there is little standardization and we&#8217;re witnessing an explosion of search innovation fueled by transformer models&#8212;affecting embeddings, LLM-based reranking, agentic search, and more.</p><p>This is the wild west, and implementations vary wildly; the gap between the best and the merely flashy is large.  </p><blockquote><p>Proper independent, task-grounded evaluations are still rare for off-the-shelf AI-powered academic search tools, but the ones I have seen tend to list the usual suspects - Undermind.ai, Elicit.com (the paid version - the free research report flow is too limited) - consistently at or near the top, showing that the excellence of a retrieval algorithm is not just subjective or random.</p><p>On the other end of the spectrum, I have unfortunately seen many lazy and horrible implementations - e.g. just naively prompting an LLM to generate a Boolean search strategy and thinking it will give good relevancy results.</p></blockquote><h2>A Glimpse of the Future</h2><p>This trend will accelerate. In a potential future where content owners provide access via MCP (Model Context Protocol) - like a <a href="https://newsroom.wiley.com/press-releases/press-release-details/2025/Wiley-Launches-Interoperable-Platform-to-Power-Scientific-Discovery-in-Worlds-Leading-AI-Technologies/default.aspx">Wiley AI Gateway</a>, the content pool becomes even more equalized assuming the agent would have the same entitlement as the user. The only thing distinguishing one search agent from another will be its retrieval capability&#8212;its &#8220;secret sauce&#8221; for finding the best results.</p><blockquote><p>In an MCP-dominated landscape, search agents wouldn&#8217;t directly control what&#8217;s returned&#8212;they&#8217;d specify queries while configured tools handle the actual retrieval. 
This would make agents more similar than in a world where each maintains centralized indexes, though they&#8217;d still distinguish themselves by strategic decisions about what to search and which sources to prioritize.</p></blockquote><h2>The Path Forward</h2><blockquote><p>Theoretical knowledge without practical experience is <strong>sterile</strong>, but practical knowledge without theoretical understanding is <strong>blind</strong>.</p></blockquote><p>My proposal is straightforward: librarians today should develop competency in information retrieval as a discipline.</p><p>This includes understanding how vector embeddings work, what makes semantic search different, how retrieval augmented generation functions, and how to test retrieval performance formally. Incidentally, all this and more are discussed on this blog!</p><p>But theory alone isn&#8217;t enough&#8212;this knowledge needs to be paired with hands-on experimentation and testing. Run actual searches. Compare results. Break things in controlled ways to understand their failure modes. Only then can you bridge the gap between knowing <em>why</em> a system should work and seeing <em>how</em> it actually behaves with real queries and real collections.</p><p>Without theory, you&#8217;re reduced to blind trial-and-error with no ability to make connections. Without practice, you&#8217;re working from assumptions that may not survive contact with messy reality. Both matter.</p><p>While I cannot give you the practical experience from trying these tools out, I can try to give you the theoretical foundation. This is why <a href="https://www.linkedin.com/posts/aarontay_libraryscience-aiinlibraries-informationretrieval-activity-7386594246587260928-_goY?utm_source=share&amp;utm_medium=member_desktop&amp;rcm=ACoAAADydNkB8cFBZ48tGuFjE4yHqQ6N6mBWEyE">we&#8217;ve developed a workshop on these topics</a>. </p><p>The landscape has shifted. 
It&#8217;s time our understanding shifted with it.<strong> </strong></p><div class="comment" data-attrs="{&quot;url&quot;:&quot;https://open.substack.com/home&quot;,&quot;commentId&quot;:168887016,&quot;comment&quot;:{&quot;id&quot;:168887016,&quot;date&quot;:&quot;2025-10-22T03:29:09.521Z&quot;,&quot;edited_at&quot;:null,&quot;body&quot;:&quot;Semantic search. Natural language search. RAG. Deep research. It&#8217;s no exaggeration to say we're witnessing a paradigm shift in search, and librarians and researchers need to understand these changes.\n\nThat's why I've teamed up with my colleague, Senior Librarian Bella Ratmelia, to offer AI-Powered Search in Libraries: A Crash Course on Understanding the Fundamentals for Library Professionals.\n\nWe first ran this comprehensive 3-session (3 hour each!) course in July 2025 under the auspices of FSCI 2025. The course covered fundamentals of information retrieval and&#8212;more importantly&#8212;the implications for searchers, librarians, and publishers as we incorporate these new search innovations. It was a hit, with 60 registrations and oversubscribed waitlists!\n\nFor more details about the course - https://www.charleston-hub.com/wp-content/uploads/2025/07/Charleston-Conference-Asia-FSCI-Workshop-3.pdf \n\nBased on what we learned, we're offering a second run at the Charleston Conference Asia preconference workshop in Bangkok, January 26-28, 2025.Can't make it to Bangkok? 
\n\nWe now offer:- Fully virtual option: $75 USD- Hybrid option: $150 USD (includes in-person Session 3 in Bangkok, requires additional main conference registration)\n\nSchedule:\n\nSession 1 (online): Monday, January 19, 2026 - 9:00 am &#8211; 12:00 pm ICT (UTC+7) \n\nSession 2 (online): Wednesday, January 21, 2026 -  9:00 am &#8211; 12:00 pm ICT (UTC+7)\n\nSession 3 (hybrid): Monday, January 26, 2026 - 9:00 am &#8211; 12:00 pm ICT (UTC+7)To register: \n\nVisit  https://www.charleston-hub.com/charleston-conference-asia/registration/   \n\nVirtual only: Scroll down to \&quot;FSCI Workshops (Optional)\&quot; and select \&quot;Attend this\&quot; ($75) next to Course 3 \n\nHybrid option: Register for the main conference AND select \&quot;Attend this\&quot; ($150) next to Course 3  \n\nBella and I are excited to present this course again, hope to see you there!&quot;,&quot;body_json&quot;:{&quot;type&quot;:&quot;doc&quot;,&quot;attrs&quot;:{&quot;schemaVersion&quot;:&quot;v1&quot;},&quot;content&quot;:[{&quot;type&quot;:&quot;paragraph&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;text&quot;,&quot;text&quot;:&quot;Semantic search. Natural language search. RAG. Deep research. It&#8217;s no exaggeration to say we're witnessing a paradigm shift in search, and librarians and researchers need to understand these changes.&quot;}]},{&quot;type&quot;:&quot;paragraph&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;text&quot;,&quot;text&quot;:&quot;That's why I've teamed up with my colleague, Senior Librarian Bella Ratmelia, to offer AI-Powered Search in Libraries: A Crash Course on Understanding the Fundamentals for Library Professionals.&quot;}]},{&quot;type&quot;:&quot;paragraph&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;text&quot;,&quot;text&quot;:&quot;We first ran this comprehensive 3-session (3 hour each!) course in July 2025 under the auspices of FSCI 2025. 
The course covered fundamentals of information retrieval and&#8212;more importantly&#8212;the implications for searchers, librarians, and publishers as we incorporate these new search innovations. It was a hit, with 60 registrations and oversubscribed waitlists!&quot;}]},{&quot;type&quot;:&quot;paragraph&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;text&quot;,&quot;text&quot;:&quot;For more details about the course - &quot;},{&quot;type&quot;:&quot;text&quot;,&quot;marks&quot;:[{&quot;type&quot;:&quot;link&quot;,&quot;attrs&quot;:{&quot;href&quot;:&quot;https://www.charleston-hub.com/wp-content/uploads/2025/07/Charleston-Conference-Asia-FSCI-Workshop-3.pdf&quot;,&quot;target&quot;:&quot;_blank&quot;,&quot;rel&quot;:&quot;nofollow ugc noopener&quot;,&quot;class&quot;:&quot;note-link&quot;}}],&quot;text&quot;:&quot;https://www.charleston-hub.com/wp-content/uploads/2025/07/Charleston-Conference-Asia-FSCI-Workshop-3.pdf&quot;}]},{&quot;type&quot;:&quot;paragraph&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;text&quot;,&quot;text&quot;:&quot;Based on what we learned, we're offering a second run at the Charleston Conference Asia preconference workshop in Bangkok, January 26-28, 2025.Can't make it to Bangkok? 
&quot;}]},{&quot;type&quot;:&quot;paragraph&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;text&quot;,&quot;text&quot;:&quot;We now offer:- Fully virtual option: $75 USD- Hybrid option: $150 USD (includes in-person Session 3 in Bangkok, requires additional main conference registration)&quot;}]},{&quot;type&quot;:&quot;paragraph&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;text&quot;,&quot;text&quot;:&quot;Schedule:&quot;}]},{&quot;type&quot;:&quot;bulletList&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;listItem&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;paragraph&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;text&quot;,&quot;text&quot;:&quot;Session 1 (online): Monday, January 19, 2026 - 9:00 am &#8211; 12:00 pm ICT (UTC+7) &quot;}]}]},{&quot;type&quot;:&quot;listItem&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;paragraph&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;text&quot;,&quot;text&quot;:&quot;Session 2 (online): Wednesday, January 21, 2026 -  9:00 am &#8211; 12:00 pm ICT (UTC+7)&quot;}]}]},{&quot;type&quot;:&quot;listItem&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;paragraph&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;text&quot;,&quot;text&quot;:&quot;Session 3 (hybrid): Monday, January 26, 2026 - 9:00 am &#8211; 12:00 pm ICT (UTC+7)To register: &quot;}]},{&quot;type&quot;:&quot;paragraph&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;text&quot;,&quot;text&quot;:&quot;Visit  &quot;},{&quot;type&quot;:&quot;text&quot;,&quot;marks&quot;:[{&quot;type&quot;:&quot;link&quot;,&quot;attrs&quot;:{&quot;href&quot;:&quot;https://www.charleston-hub.com/charleston-conference-asia/registration/&quot;,&quot;target&quot;:&quot;_blank&quot;,&quot;rel&quot;:&quot;nofollow ugc 
noopener&quot;,&quot;class&quot;:&quot;note-link&quot;}}],&quot;text&quot;:&quot;https://www.charleston-hub.com/charleston-conference-asia/registration/&quot;}]}]}]},{&quot;type&quot;:&quot;bulletList&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;listItem&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;paragraph&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;text&quot;,&quot;text&quot;:&quot;Virtual only: Scroll down to \&quot;FSCI Workshops (Optional)\&quot; and select \&quot;Attend this\&quot; ($75) next to Course 3 &quot;}]}]},{&quot;type&quot;:&quot;listItem&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;paragraph&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;text&quot;,&quot;text&quot;:&quot;Hybrid option: Register for the main conference AND select \&quot;Attend this\&quot; ($150) next to Course 3  &quot;}]},{&quot;type&quot;:&quot;paragraph&quot;,&quot;content&quot;:[{&quot;type&quot;:&quot;text&quot;,&quot;text&quot;:&quot;Bella and I are excited to present this course again, hope to see you there!&quot;}]}]}]}]},&quot;restacks&quot;:0,&quot;reaction_count&quot;:0,&quot;attachments&quot;:[{&quot;id&quot;:&quot;a05aa7bf-ae4b-4b10-9161-1d7255010863&quot;,&quot;type&quot;:&quot;image&quot;,&quot;imageUrl&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/7b77eccc-2d8c-49ed-ab8d-3a8eaff7c09e_667x873.png&quot;,&quot;imageWidth&quot;:667,&quot;imageHeight&quot;:873,&quot;explicit&quot;:false},{&quot;id&quot;:&quot;6f2d686b-52ff-4a39-ac07-2217238fe7d0&quot;,&quot;type&quot;:&quot;link&quot;,&quot;linkMetadata&quot;:{&quot;url&quot;:&quot;https://www.charleston-hub.com/charleston-conference-asia/registration/&quot;,&quot;host&quot;:&quot;charleston-hub.com&quot;,&quot;title&quot;:&quot;Registration - Charleston Hub&quot;,&quot;description&quot;:&quot;May 28, 2025 - 
-&quot;,&quot;image&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/07a762bb-05ab-43ea-a9ca-ae4e1b93121d_800x200.png&quot;,&quot;original_image&quot;:&quot;https://www.charleston-hub.com/wp-content/uploads/2020/10/REGISTER-NOW-1.png&quot;},&quot;explicit&quot;:false}],&quot;name&quot;:&quot;Aaron Tay&quot;,&quot;user_id&quot;:10210801,&quot;photo_url&quot;:&quot;https://substackcdn.com/image/fetch/f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fbucketeer-e05bbc84-baa3-437e-9518-adb32be77984.s3.amazonaws.com%2Fpublic%2Fimages%2Ff39219af-fee4-4db6-a3e1-47bb76350df6_314x280.jpeg&quot;,&quot;user_bestseller_tier&quot;:null,&quot;userStatus&quot;:{&quot;bestsellerTier&quot;:null,&quot;subscriberTier&quot;:null,&quot;leaderboard&quot;:null,&quot;vip&quot;:false,&quot;badge&quot;:null,&quot;paidPublicationIds&quot;:[],&quot;subscriber&quot;:null}},&quot;source&quot;:null,&quot;forumChannel&quot;:null}" data-component-name="CommentPlaceholder"></div><p><strong> </strong></p><p></p><p></p>]]></content:encoded></item></channel></rss>