{"exhaustive":{"nbHits":false,"typo":false},"exhaustiveNbHits":false,"exhaustiveTypo":false,"hits":[{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"thm"},"title":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"<em>RAGFlow</em> is an open-source RAG engine based on OCR and document parsing"},"url":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"https://github.com/infiniflow/<em>ragflow</em>"}},"_tags":["story","author_thm","story_39896923"],"author":"thm","children":[39897959,39898012,39899351,39900324,39900338,39900598,39900736,39901356,39901380,39901514,39901877,39903108,39903304,39903439,39906512],"created_at":"2024-04-01T17:50:54Z","created_at_i":1711993854,"num_comments":53,"objectID":"39896923","points":230,"story_id":39896923,"title":"RAGFlow is an open-source RAG engine based on OCR and document parsing","updated_at":"2025-10-21T16:12:10Z","url":"https://github.com/infiniflow/ragflow"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"vissidarte_choi"},"title":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"<em>RAGFlow</em>: Modern Agentic RAG Based on Graph"},"url":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"https://<em>ragflow</em>.io/blog/<em>ragflow</em>-enters-agentic-era"}},"_tags":["story","author_vissidarte_choi","story_40936082"],"author":"vissidarte_choi","children":[40936083,40936133,40936227],"created_at":"2024-07-11T12:43:55Z","created_at_i":1720701835,"num_comments":5,"objectID":"40936082","points":13,"story_id":40936082,"title":"RAGFlow: Modern Agentic RAG Based on Graph","updated_at":"2025-01-09T02:16:18Z","url":"https://ragflow.io/blog/ragflow-enters-agentic-era"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"vissidarte_choi"},"title":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"DeepSeek-V2 integrated, <em>RAGFlow</em> v0.5.0 is released"},"url":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"https://github.com/infiniflow/<em>ragflow</em>/releases/tag/v0.5.0"}},"_tags":["story","author_vissidarte_choi","story_40294775"],"author":"vissidarte_choi","created_at":"2024-05-08T05:54:31Z","created_at_i":1715147671,"num_comments":0,"objectID":"40294775","points":7,"story_id":40294775,"title":"DeepSeek-V2 integrated, RAGFlow v0.5.0 is released","updated_at":"2024-09-20T17:05:21Z","url":"https://github.com/infiniflow/ragflow/releases/tag/v0.5.0"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"vissidarte_choi"},"title":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"<em>RAGFlow</em>: Customizable, explainable RAG engine based on doc structure recognition"},"url":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"https://medium.com/@infiniflowai/<em>ragflow</em>-customizable-credible-explainable-rag-engine-based-on-document-structure-recognition-6a2a2369bd2a"}},"_tags":["story","author_vissidarte_choi","story_39912056"],"author":"vissidarte_choi","created_at":"2024-04-02T23:44:21Z","created_at_i":1712101461,"num_comments":0,"objectID":"39912056","points":7,"story_id":39912056,"title":"RAGFlow: Customizable, explainable RAG engine based on doc structure recognition","updated_at":"2024-09-20T16:45:09Z","url":"https://medium.com/@infiniflowai/ragflow-customizable-credible-explainable-rag-engine-based-on-document-structure-recognition-6a2a2369bd2a"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"vissidarte_choi"},"title":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"<em>RAGFlow</em> 15.0 Deep Dive: DeepDoc model upgrades, Enhanced Agent, new RAG strategy"},"url":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"https://<em>ragflow</em>.io/blog/a-deep-dive-into-<em>ragflow</em>-v0.15.0"}},"_tags":["story","author_vissidarte_choi","story_42460501"],"author":"vissidarte_choi","created_at":"2024-12-19T11:37:52Z","created_at_i":1734608272,"num_comments":0,"objectID":"42460501","points":4,"story_id":42460501,"title":"RAGFlow 15.0 Deep Dive: DeepDoc model upgrades, Enhanced Agent, new RAG strategy","updated_at":"2024-12-19T11:42:59Z","url":"https://ragflow.io/blog/a-deep-dive-into-ragflow-v0.15.0"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"YongtengRey"},"title":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"Open source end-to-end RAG-based Deep Research implemented within <em>RAGFlow</em>"},"url":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"https://<em>ragflow</em>.io/docs/dev/release_notes"}},"_tags":["story","author_YongtengRey","story_43253467"],"author":"YongtengRey","children":[43253468],"created_at":"2025-03-04T12:00:34Z","created_at_i":1741089634,"num_comments":0,"objectID":"43253467","points":3,"story_id":43253467,"title":"Open source end-to-end RAG-based Deep Research implemented within RAGFlow","updated_at":"2025-03-04T12:15:59Z","url":"https://ragflow.io/docs/dev/release_notes"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"yingfeng"},"title":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"<em>RAGFlow</em> 0.9 is released to support GraphRAG end-to-end"},"url":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"https://github.com/infiniflow/<em>ragflow</em>/releases/tag/v0.9.0"}},"_tags":["story","author_yingfeng","story_41170397"],"author":"yingfeng","children":[41170647],"created_at":"2024-08-06T12:53:28Z","created_at_i":1722948808,"num_comments":0,"objectID":"41170397","points":3,"story_id":41170397,"title":"RAGFlow 0.9 is released to support GraphRAG end-to-end","updated_at":"2024-09-20T17:36:19Z","url":"https://github.com/infiniflow/ragflow/releases/tag/v0.9.0"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"NonStopOyster"},"title":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"Unpatched vuln in <em>RAGFlow</em> allows for post-auth RCE"},"url":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"https://zeropath.com/blog/<em>ragflow</em>-rce-unpatched-vulnerability"}},"_tags":["story","author_NonStopOyster","story_47754820"],"author":"NonStopOyster","children":[47754821],"created_at":"2026-04-13T16:52:44Z","created_at_i":1776099164,"num_comments":0,"objectID":"47754820","points":2,"story_id":47754820,"title":"Unpatched vuln in RAGFlow allows for post-auth RCE","updated_at":"2026-04-13T18:44:20Z","url":"https://zeropath.com/blog/ragflow-rce-unpatched-vulnerability"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"saikatsg"},"title":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"<em>Ragflow</em>: fuses RAG with Agent capabilities to create context layer for LLMs"},"url":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"https://github.com/infiniflow/<em>ragflow</em>"}},"_tags":["story","author_saikatsg","story_47313655"],"author":"saikatsg","created_at":"2026-03-09T18:54:37Z","created_at_i":1773082477,"num_comments":0,"objectID":"47313655","points":2,"story_id":47313655,"title":"Ragflow: fuses RAG with Agent capabilities to create context layer for LLMs","updated_at":"2026-03-09T19:15:13Z","url":"https://github.com/infiniflow/ragflow"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"vissidarte_choi"},"title":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"Integrated Rerankers, implemented RAPTOR, <em>RAGFlow</em> 0.7 released"},"url":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"https://github.com/infiniflow/<em>ragflow</em>/releases/tag/v0.7.0"}},"_tags":["story","author_vissidarte_choi","story_40522767"],"author":"vissidarte_choi","created_at":"2024-05-30T12:12:24Z","created_at_i":1717071144,"num_comments":0,"objectID":"40522767","points":2,"story_id":40522767,"title":"Integrated Rerankers, implemented RAPTOR, RAGFlow 0.7 released","updated_at":"2024-09-20T17:09:26Z","url":"https://github.com/infiniflow/ragflow/releases/tag/v0.7.0"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"vissidarte_choi"},"title":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"Agentic Workflow: What's inside <em>RAGFlow</em> v0.20.0"},"url":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"https://medium.com/@infiniflowai/agentic-workflow-whats-inside-<em>ragflow</em>-v0-20-0-789fdd4397f6"}},"_tags":["story","author_vissidarte_choi","story_44834725"],"author":"vissidarte_choi","created_at":"2025-08-08T08:14:25Z","created_at_i":1754640865,"num_comments":0,"objectID":"44834725","points":1,"story_id":44834725,"title":"Agentic Workflow: What's inside RAGFlow v0.20.0","updated_at":"2026-03-05T22:30:28Z","url":"https://medium.com/@infiniflowai/agentic-workflow-whats-inside-ragflow-v0-20-0-789fdd4397f6"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"vissidarte_choi"},"title":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"Implementing Text2SQL with <em>RAGFlow</em> v0.10"},"url":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"https://medium.com/@infiniflowai/implementing-text2sql-with-<em>ragflow</em>-v0-10-710cda6c0683"}},"_tags":["story","author_vissidarte_choi","story_41623348"],"author":"vissidarte_choi","created_at":"2024-09-23T07:32:04Z","created_at_i":1727076724,"num_comments":0,"objectID":"41623348","points":1,"story_id":41623348,"title":"Implementing Text2SQL with RAGFlow v0.10","updated_at":"2024-09-23T07:37:24Z","url":"https://medium.com/@infiniflowai/implementing-text2sql-with-ragflow-v0-10-710cda6c0683"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"jjjutla"},"story_text":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"Hey HN, I'm JJ, Co-Founder of Gecko Security (<a href=\"https://www.gecko.security\">https://www.gecko.security</a>). We're building a new kind of static analysis tool that uses LLMs to find complex business logic and multi-step vulnerabilities that current scanners miss. We\u2019ve used it to find 30+ CVEs in projects like Ollama, Gradio, and <em>Ragflow</em> (<a href=\"https://www.gecko.security/research\">https://www.gecko.security/research</a>). You can try it yourself on any OSS repo at (<a href=\"https://app.gecko.security\">https://app.gecko.security</a>).<p>Anyone who\u2019s used SAST (Static Application Security Testing) tools knows the issues of high false positives while missing entire classes of vulnerabilities like AuthN/Z bypasses or privilege escalations. This limitation is a result of their core architecture. By design, SAST tools parse code into a simplistic model like an AST or call graph, which quickly loses context in dynamically typed languages or across microservice boundaries, and limits coverage to only resolving basic call chains. When detecting vulnerabilities they rely on pattern matching with Regex or YAML rules, which can be effective for basic technical classes like (XSS, SQLi) but inadequate for logic flaws that don\u2019t conform to well-known shapes and need long sequences of dependent operations to reach an exploitable state.<p>My co-founder and I saw these limitations throughout our careers in national intelligence and military cyber forces, where we built automated tooling to defend critical infrastructure. We realised that LLMs, with the right architecture, could finally solve them.<p>Vulnerabilities are contextual. What's exploitable depends entirely on each application's security model. We realized accurate detection requires understanding what's supposed to be protected and why breaking it matters. This meant embedding threat modeling directly into our analysis, not treating it as an afterthought.<p>To achieve this, we first had to solve the code parsing problem. Our solution was to build a custom, compiler-accurate indexer inspired by GitHub's stack graphs approach to precisely navigate code, like an IDE. We build on the LSIF approach (<a href=\"https://lsif.dev/\" rel=\"nofollow\">https://lsif.dev/</a>) but replace the verbose JSON with a compact protobuf schema to serialise symbol definitions and references in a binary format. We use language\u2011specific tools to parse and type\u2011check code, emitting a sequence of Protobuf messages that record a symbol\u2019s position, definition, and reference information. By using Protobuf\u2019s efficiency and strong typing, we can produce smaller indexes, but also preserve the compiler\u2011accurate semantic information required for detecting complex call chains.<p>This is why most &quot;SAST + LLM&quot; tools that use AST parsing fail - they feed LLMs incomplete or incorrect code information from traditional parsers, making it difficult to accurately reason about security issues with missing context.<p>With our indexer providing accurate code structure, we use an LLM to perform threat modeling by analyzing developer intent, data and trust boundaries, and exposed endpoints to generate potential attack scenarios. This is where LLMs' tendency to hallucinate becomes a breakthrough feature.<p>For each potential attack path generated, we perform a systematic search, querying the indexer to gather all necessary context and reconstruct the full call chain from source to sink. To validate the vulnerability we use a Monte Carlo Tree Self-refine (MCTSr) algorithm and a 'win function' to determine the likelihood that a hypothesized attack could work. Once a finding is above a set practicality threshold it is confirmed as a true positive.<p>Using this approach, we discovered vulnerabilities like CVE-2025-51479 in ONYX (an OSS enterprise search platform) where Curators could modify any group instead of just their assigned ones. The user-group API had a user parameter that should check permissions but never used it. Gecko inferred developers intended to restrict Curator access because both the UI and similar API functions properly validated this permission. This established &quot;curators have limited scope&quot; as a security invariant that this specific API violated. Traditional SAST can't detect this. Any rule to flag unused user parameters would drown you in false positives since many functions legitimately keep unused parameters. And more importantly, detecting this requires knowing which functions handle authorization, understanding ONYX's Curator permission model, and recognizing the validation pattern across multiple files - contextual reasoning that SAST simply cannot do.<p>We have several enterprise customers using Gecko because it solves problems they couldn't address with traditional SAST tools. They're seeing 50% fewer false positives on the same codebases and finding vulnerabilities that previously only showed up in manual pentests.<p>Digging into false positives, no static analysis tool will ever achieve perfect accuracy, AI or otherwise. We reduce them at two key points. First, our indexer eliminates any programmatic parsing errors that create incorrect call chains that traditional AST tools are susceptible to. Second, we avoid unwanted LLM hallucinations and reasoning errors by asking specific, contextual questions rather than open-ended ones. The LLM knows which security invariants need to hold and can make deterministic assessments based on the context. When we do flag something, manual review is quick because we provide complete source-to-sink dataflow analysis with proof-of-concept code and output findings based on confidence scores.<p>We\u2019d love to get any feedback from the community, ideas for future direction, or experiences in this space. I\u2019ll be in the comments to respond!"},"title":{"matchLevel":"none","matchedWords":[],"value":"Launch HN: Gecko Security (YC F24) \u2013 AI That Finds Vulnerabilities in Code"}},"_tags":["story","author_jjjutla","story_44747204","launch_hn"],"author":"jjjutla","children":[44747541,44747575,44747637,44747798,44747850,44748209,44749661,44749725,44750727,44754393,44755199,44756271,44758207,44763730,44776137],"created_at":"2025-07-31T16:23:09Z","created_at_i":1753978989,"num_comments":36,"objectID":"44747204","points":66,"story_id":44747204,"story_text":"Hey HN, I&#x27;m JJ, Co-Founder of Gecko Security (<a href=\"https:&#x2F;&#x2F;www.gecko.security\">https:&#x2F;&#x2F;www.gecko.security</a>). We&#x27;re building a new kind of static analysis tool that uses LLMs to find complex business logic and multi-step vulnerabilities that current scanners miss. We\u2019ve used it to find 30+ CVEs in projects like Ollama, Gradio, and Ragflow (<a href=\"https:&#x2F;&#x2F;www.gecko.security&#x2F;research\">https:&#x2F;&#x2F;www.gecko.security&#x2F;research</a>). You can try it yourself on any OSS repo at (<a href=\"https:&#x2F;&#x2F;app.gecko.security\">https:&#x2F;&#x2F;app.gecko.security</a>).<p>Anyone who\u2019s used SAST (Static Application Security Testing) tools knows the issues of high false positives while missing entire classes of vulnerabilities like AuthN&#x2F;Z bypasses or privilege escalations. This limitation is a result of their core architecture. By design, SAST tools parse code into a simplistic model like an AST or call graph, which quickly loses context in dynamically typed languages or across microservice boundaries, and limits coverage to only resolving basic call chains. When detecting vulnerabilities they rely on pattern matching with Regex or YAML rules, which can be effective for basic technical classes like (XSS, SQLi) but inadequate for logic flaws that don\u2019t conform to well-known shapes and need long sequences of dependent operations to reach an exploitable state.<p>My co-founder and I saw these limitations throughout our careers in national intelligence and military cyber forces, where we built automated tooling to defend critical infrastructure. We realised that LLMs, with the right architecture, could finally solve them.<p>Vulnerabilities are contextual. What&#x27;s exploitable depends entirely on each application&#x27;s security model. We realized accurate detection requires understanding what&#x27;s supposed to be protected and why breaking it matters. This meant embedding threat modeling directly into our analysis, not treating it as an afterthought.<p>To achieve this, we first had to solve the code parsing problem. Our solution was to build a custom, compiler-accurate indexer inspired by GitHub&#x27;s stack graphs approach to precisely navigate code, like an IDE. We build on the LSIF approach (<a href=\"https:&#x2F;&#x2F;lsif.dev&#x2F;\" rel=\"nofollow\">https:&#x2F;&#x2F;lsif.dev&#x2F;</a>) but replace the verbose JSON with a compact protobuf schema to serialise symbol definitions and references in a binary format. We use language\u2011specific tools to parse and type\u2011check code, emitting a sequence of Protobuf messages that record a symbol\u2019s position, definition, and reference information. By using Protobuf\u2019s efficiency and strong typing, we can produce smaller indexes, but also preserve the compiler\u2011accurate semantic information required for detecting complex call chains.<p>This is why most &quot;SAST + LLM&quot; tools that use AST parsing fail - they feed LLMs incomplete or incorrect code information from traditional parsers, making it difficult to accurately reason about security issues with missing context.<p>With our indexer providing accurate code structure, we use an LLM to perform threat modeling by analyzing developer intent, data and trust boundaries, and exposed endpoints to generate potential attack scenarios. This is where LLMs&#x27; tendency to hallucinate becomes a breakthrough feature.<p>For each potential attack path generated, we perform a systematic search, querying the indexer to gather all necessary context and reconstruct the full call chain from source to sink. To validate the vulnerability we use a Monte Carlo Tree Self-refine (MCTSr) algorithm and a &#x27;win function&#x27; to determine the likelihood that a hypothesized attack could work. Once a finding is above a set practicality threshold it is confirmed as a true positive.<p>Using this approach, we discovered vulnerabilities like CVE-2025-51479 in ONYX (an OSS enterprise search platform) where Curators could modify any group instead of just their assigned ones. The user-group API had a user parameter that should check permissions but never used it. Gecko inferred developers intended to restrict Curator access because both the UI and similar API functions properly validated this permission. This established &quot;curators have limited scope&quot; as a security invariant that this specific API violated. Traditional SAST can&#x27;t detect this. Any rule to flag unused user parameters would drown you in false positives since many functions legitimately keep unused parameters. And more importantly, detecting this requires knowing which functions handle authorization, understanding ONYX&#x27;s Curator permission model, and recognizing the validation pattern across multiple files - contextual reasoning that SAST simply cannot do.<p>We have several enterprise customers using Gecko because it solves problems they couldn&#x27;t address with traditional SAST tools. They&#x27;re seeing 50% fewer false positives on the same codebases and finding vulnerabilities that previously only showed up in manual pentests.<p>Digging into false positives, no static analysis tool will ever achieve perfect accuracy, AI or otherwise. We reduce them at two key points. First, our indexer eliminates any programmatic parsing errors that create incorrect call chains that traditional AST tools are susceptible to. Second, we avoid unwanted LLM hallucinations and reasoning errors by asking specific, contextual questions rather than open-ended ones. The LLM knows which security invariants need to hold and can make deterministic assessments based on the context. When we do flag something, manual review is quick because we provide complete source-to-sink dataflow analysis with proof-of-concept code and output findings based on confidence scores.<p>We\u2019d love to get any feedback from the community, ideas for future direction, or experiences in this space. I\u2019ll be in the comments to respond!","title":"Launch HN: Gecko Security (YC F24) \u2013 AI That Finds Vulnerabilities in Code","updated_at":"2026-04-05T14:48:46Z"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"emmettm"},"story_text":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"Hi HackerNews,<p>Lately, I have seen an explosion in posts offering paid APIs/services to get unstructured data into LLMs (i.e. langchain extract, <em>ragflow</em>, unstructured, unstract, just to name a few) and I have been largely disappointed by them, either because they fail to implement multimodal support, fail to give good context for &quot;really tricky&quot; PDFs / Word docs / Powerpoints, or are just plain difficult to use. In light of all these posts I figured I'd share my solution that has been working smoothly for me and my clients. I put it up on GitHub for free so you can check it out and hopefully offer some feedback / criticism or contribute to the code yourself.<p>and BTW, I'm not trying to throw shade at any of the services mentioned, I'm just giving my honest experience in case there are others out there who feel the same way and want something that works<p>Cheers!"},"title":{"matchLevel":"none","matchedWords":[],"value":"Show HN: I just open sourced my document/website extractor for Vision-LLMs"},"url":{"matchLevel":"none","matchedWords":[],"value":"https://github.com/emcf/thepipe"}},"_tags":["story","author_emmettm","story_39909351","show_hn"],"author":"emmettm","children":[39909381,39909478,39914376],"created_at":"2024-04-02T18:40:01Z","created_at_i":1712083201,"num_comments":4,"objectID":"39909351","points":37,"story_id":39909351,"story_text":"Hi HackerNews,<p>Lately, I have seen an explosion in posts offering paid APIs&#x2F;services to get unstructured data into LLMs (i.e. langchain extract, ragflow, unstructured, unstract, just to name a few) and I have been largely disappointed by them, either because they fail to implement multimodal support, fail to give good context for &quot;really tricky&quot; PDFs &#x2F; Word docs &#x2F; Powerpoints, or are just plain difficult to use. In light of all these posts I figured I&#x27;d share my solution that has been working smoothly for me and my clients. I put it up on GitHub for free so you can check it out and hopefully offer some feedback &#x2F; criticism or contribute to the code yourself.<p>and BTW, I&#x27;m not trying to throw shade at any of the services mentioned, I&#x27;m just giving my honest experience in case there are others out there who feel the same way and want something that works<p>Cheers!","title":"Show HN: I just open sourced my document/website extractor for Vision-LLMs","updated_at":"2024-09-20T16:44:44Z","url":"https://github.com/emcf/thepipe"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"StephenWalther"},"story_text":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"Hi HN \u2014 I built Superexpert.AI, an open\u2011source platform that lets you spin up multi\u2011task AI agents in minutes without writing any code (and lets you extend everything later).<p><i>What it does</i><p>- Plug\u2011and\u2011play agents \u2013 Create agents from a web form. Each agent can contain multiple tasks, and each task can run a different AI model, use its own tools, and follow custom instructions.<p>- First\u2011class extensibility \u2013 Register a TypeScript function with registerServerTool, registerClientTool, or registerContextTool to add new functionality. If you want to share it, publish it as an NPM package and Superexpert.AI will auto\u2011detect it when installed.<p>- Built\u2011in RAG \u2013 Upload docs via the UI, or use a CLI that chunks 100 MB files, auto\u2011resumes after network errors, auto-resumes after network errors (e.g. uploading a 500-page PDF manual) and pipes the data into your agent.<p>- Launch a full chat app in minutes \u2013 Everything is MIT\u2011licensed NextJS + TypeScript + Tailwind + Postgres. Deploy like any other NextJS project.<p><i>Links</i><p>- Walkthrough (no sign\u2011up): <a href=\"https://app.arcade.software/share/yGqgrj65xp6y4mkDbNnT\" rel=\"nofollow\">https://app.arcade.software/share/yGqgrj65xp6y4mkDbNnT</a><p>- Live demo (email sign\u2011up): <a href=\"https://demo.superexpert.ai/\" rel=\"nofollow\">https://demo.superexpert.ai/</a><p>- GitHub repo: <a href=\"https://github.com/Superexpert/superexpert-ai\">https://github.com/Superexpert/superexpert-ai</a><p>- Quick\u2011start guide: <a href=\"https://superexpert.ai/docs/quick-start/\" rel=\"nofollow\">https://superexpert.ai/docs/quick-start/</a><p>- Full docs &amp; tutorials: <a href=\"https://superexpert.ai/\" rel=\"nofollow\">https://superexpert.ai/</a><p><i>Why I built it</i><p>I kept hand\u2011coding LangGraph\u2011style workflows for clients and wanted a web\u2011first, stack\u2011agnostic way to launch agents fast and stay fully modifiable. Superexpert.AI lets you extend or swap every layer \u2014 from models to tools to UI themes \u2014 with TypeScript.<p><i>Looking for feedback</i><p>1. Agent use\u2011cases you still have to hand\u2011code today.<p>2. Gaps in the <em>RAG flow</em> or model tooling that block production use.<p>Discord for deeper chat: <a href=\"https://discord.gg/wsrc3enWN3\" rel=\"nofollow\">https://discord.gg/wsrc3enWN3</a><p>\u2013\u2013 Stephen"},"title":{"matchLevel":"none","matchedWords":[],"value":"Show HN: Superexpert.ai \u2013 Open-source, no-code platform for multi-task AI agents"},"url":{"matchLevel":"none","matchedWords":[],"value":"https://superexpert.ai/"}},"_tags":["story","author_StephenWalther","story_43905537","show_hn"],"author":"StephenWalther","children":[43905646],"created_at":"2025-05-06T14:27:18Z","created_at_i":1746541638,"num_comments":1,"objectID":"43905537","points":3,"story_id":43905537,"story_text":"Hi HN \u2014 I built Superexpert.AI, an open\u2011source platform that lets you spin up multi\u2011task AI agents in minutes without writing any code (and lets you extend everything later).<p><i>What it does</i><p>- Plug\u2011and\u2011play agents \u2013 Create agents from a web form. Each agent can contain multiple tasks, and each task can run a different AI model, use its own tools, and follow custom instructions.<p>- First\u2011class extensibility \u2013 Register a TypeScript function with registerServerTool, registerClientTool, or registerContextTool to add new functionality. If you want to share it, publish it as an NPM package and Superexpert.AI will auto\u2011detect it when installed.<p>- Built\u2011in RAG \u2013 Upload docs via the UI, or use a CLI that chunks 100 MB files, auto\u2011resumes after network errors, auto-resumes after network errors (e.g. uploading a 500-page PDF manual) and pipes the data into your agent.<p>- Launch a full chat app in minutes \u2013 Everything is MIT\u2011licensed NextJS + TypeScript + Tailwind + Postgres. Deploy like any other NextJS project.<p><i>Links</i><p>- Walkthrough (no sign\u2011up): <a href=\"https:&#x2F;&#x2F;app.arcade.software&#x2F;share&#x2F;yGqgrj65xp6y4mkDbNnT\" rel=\"nofollow\">https:&#x2F;&#x2F;app.arcade.software&#x2F;share&#x2F;yGqgrj65xp6y4mkDbNnT</a><p>- Live demo (email sign\u2011up): <a href=\"https:&#x2F;&#x2F;demo.superexpert.ai&#x2F;\" rel=\"nofollow\">https:&#x2F;&#x2F;demo.superexpert.ai&#x2F;</a><p>- GitHub repo: <a href=\"https:&#x2F;&#x2F;github.com&#x2F;Superexpert&#x2F;superexpert-ai\">https:&#x2F;&#x2F;github.com&#x2F;Superexpert&#x2F;superexpert-ai</a><p>- Quick\u2011start guide: <a href=\"https:&#x2F;&#x2F;superexpert.ai&#x2F;docs&#x2F;quick-start&#x2F;\" rel=\"nofollow\">https:&#x2F;&#x2F;superexpert.ai&#x2F;docs&#x2F;quick-start&#x2F;</a><p>- Full docs &amp; tutorials: <a href=\"https:&#x2F;&#x2F;superexpert.ai&#x2F;\" rel=\"nofollow\">https:&#x2F;&#x2F;superexpert.ai&#x2F;</a><p><i>Why I built it</i><p>I kept hand\u2011coding LangGraph\u2011style workflows for clients and wanted a web\u2011first, stack\u2011agnostic way to launch agents fast and stay fully modifiable. Superexpert.AI lets you extend or swap every layer \u2014 from models to tools to UI themes \u2014 with TypeScript.<p><i>Looking for feedback</i><p>1. Agent use\u2011cases you still have to hand\u2011code today.<p>2. Gaps in the RAG flow or model tooling that block production use.<p>Discord for deeper chat: <a href=\"https:&#x2F;&#x2F;discord.gg&#x2F;wsrc3enWN3\" rel=\"nofollow\">https:&#x2F;&#x2F;discord.gg&#x2F;wsrc3enWN3</a><p>\u2013\u2013 Stephen","title":"Show HN: Superexpert.ai \u2013 Open-source, no-code platform for multi-task AI agents","updated_at":"2025-05-07T06:24:49Z","url":"https://superexpert.ai/"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"ZeroAurora"},"story_text":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"Once again I'm seeing an agent development platform in GitHub Trending. Dify, <em>RAGFlow</em>, Flowise, Sim, Coze, countless to name, yet implementing the exact same goal. And there are still more emerging.<p>It seems like anything AI can be a trending, despite their repetitive works."},"title":{"matchLevel":"none","matchedWords":[],"value":"Ask HN: Why are there always new agent platforms?"}},"_tags":["story","author_ZeroAurora","story_46578498","ask_hn"],"author":"ZeroAurora","children":[46580727],"created_at":"2026-01-11T18:49:46Z","created_at_i":1768157386,"num_comments":1,"objectID":"46578498","points":1,"story_id":46578498,"story_text":"Once again I&#x27;m seeing an agent development platform in GitHub Trending. Dify, RAGFlow, Flowise, Sim, Coze, countless to name, yet implementing the exact same goal. And there are still more emerging.<p>It seems like anything AI can be a trending, despite their repetitive works.","title":"Ask HN: Why are there always new agent platforms?","updated_at":"2026-03-05T23:21:24Z"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"Norcim133"},"comment_text":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"Correct-ish. LlamaCloud and GroundX do everything up to retrieval. Here is an interactive graphic of major players along <em>RAG flow</em>: <a href=\"https://claude.ai/public/artifacts/b872435b-1d9c-461e-a29c-b03d252053a0\" rel=\"nofollow\">https://claude.ai/public/artifacts/b872435b-1d9c-461e-a29c-b...</a>"},"story_title":{"matchLevel":"none","matchedWords":[],"value":"Ask HN: Who is doing the best Word/PDF RAG tool with deep research?"}},"_tags":["comment","author_Norcim133","story_44641721"],"author":"Norcim133","comment_text":"Correct-ish. LlamaCloud and GroundX do everything up to retrieval. Here is an interactive graphic of major players along RAG flow: <a href=\"https:&#x2F;&#x2F;claude.ai&#x2F;public&#x2F;artifacts&#x2F;b872435b-1d9c-461e-a29c-b03d252053a0\" rel=\"nofollow\">https:&#x2F;&#x2F;claude.ai&#x2F;public&#x2F;artifacts&#x2F;b872435b-1d9c-461e-a29c-b...</a>","created_at":"2025-07-22T19:36:53Z","created_at_i":1753213013,"objectID":"44652021","parent_id":44642748,"story_id":44641721,"story_title":"Ask HN: Who is doing the best Word/PDF RAG tool with deep research?","updated_at":"2025-07-22T19:41:26Z"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"aliasmaya"},"comment_text":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"Seems that you're looking for a RAG System, and you may have a try <em>RAGFlow</em>"},"story_title":{"matchLevel":"none","matchedWords":[],"value":"Is there a way to run an LLM as a better local search engine?"}},"_tags":["comment","author_aliasmaya","story_44307466"],"author":"aliasmaya","children":[44308682],"comment_text":"Seems that you&#x27;re looking for a RAG System, and you may have a try RAGFlow","created_at":"2025-06-18T08:10:49Z","created_at_i":1750234249,"objectID":"44307724","parent_id":44307466,"story_id":44307466,"story_title":"Is there a way to run an LLM as a better local search engine?","updated_at":"2025-06-18T15:58:44Z"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"simple10"},"comment_text":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"Congrats on the launch! Looking forward to playing with it.<p>Do you mind elaborating on what differentiates Sim Studio from n8n, Flowise, <em>RAGFlow</em> and other open source flow based AI automation platforms?"},"story_title":{"matchLevel":"none","matchedWords":[],"value":"Show HN: Sim Studio \u2013 Open-Source Agent Workflow GUI"},"story_url":{"matchLevel":"none","matchedWords":[],"value":"https://github.com/simstudioai/sim"}},"_tags":["comment","author_simple10","story_43823096"],"author":"simple10","children":[43824445],"comment_text":"Congrats on the launch! Looking forward to playing with it.<p>Do you mind elaborating on what differentiates Sim Studio from n8n, Flowise, RAGFlow and other open source flow based AI automation platforms?","created_at":"2025-04-28T18:01:02Z","created_at_i":1745863262,"objectID":"43824178","parent_id":43823096,"story_id":43823096,"story_title":"Show HN: Sim Studio \u2013 Open-Source Agent Workflow GUI","story_url":"https://github.com/simstudioai/sim","updated_at":"2025-04-30T00:06:43Z"},{"_highlightResult":{"author":{"matchLevel":"none","matchedWords":[],"value":"yingfeng"},"comment_text":{"fullyHighlighted":false,"matchLevel":"full","matchedWords":["ragflow"],"value":"<em>RAGFlow</em> v0.17.0 now enables Agentic Reasoning for Deep Research, integrating any LLM \u2014 no RLM dependency required."},"story_title":{"matchLevel":"none","matchedWords":[],"value":"[dead]"}},"_tags":["comment","author_yingfeng","story_43253353"],"author":"yingfeng","comment_text":"RAGFlow v0.17.0 now enables Agentic Reasoning for Deep Research, integrating any LLM \u2014 no RLM dependency required.","created_at":"2025-03-04T11:43:52Z","created_at_i":1741088632,"objectID":"43253354","parent_id":43253353,"story_id":43253353,"story_title":"[dead]","updated_at":"2025-03-04T11:48:59Z"}],"hitsPerPage":20,"nbHits":3936,"nbPages":50,"page":0,"params":"query=ragflow&advancedSyntax=true&analyticsTags=backend","processingTimeMS":12,"processingTimingsMS":{"_request":{"queue":14,"roundTrip":22},"afterFetch":{"format":{"total":1},"merge":{"mergeLoop":{"prepareNextHit":5,"total":5},"total":5},"total":5},"fetch":{"query":5,"total":6},"total":12},"query":"ragflow","serverTimeMS":27}