{"id":6399,"date":"2025-10-18T11:18:39","date_gmt":"2025-10-18T03:18:39","guid":{"rendered":"https:\/\/nullthought.net\/?p=6399"},"modified":"2025-10-18T11:18:40","modified_gmt":"2025-10-18T03:18:40","slug":"reducto-%e4%b8%8e-rag-anything-%e7%9a%84%e6%af%94%e8%be%83%e4%b8%8e%e5%88%86%e6%9e%90","status":"publish","type":"post","link":"https:\/\/nullthought.net\/?p=6399","title":{"rendered":"Reducto \u4e0e RAG-Anything \u7684\u6bd4\u8f83\u4e0e\u5206\u6790"},"content":{"rendered":"\n<p><strong><a href=\"https:\/\/nullthought.net\/?p=6350\" target=\"_blank\" rel=\"noreferrer noopener\">Reducto <\/a><\/strong>\u548c <strong><a href=\"https:\/\/nullthought.net\/?p=6393\" target=\"_blank\" rel=\"noreferrer noopener\">RAG-Anything<\/a><\/strong> \u90fd\u5229\u7528<a href=\"https:\/\/nullthought.net\/?p=4920\" target=\"_blank\" rel=\"noreferrer noopener\">\u89c6\u89c9-\u8bed\u8a00\u6a21\u578b\uff08VLM\uff09<\/a>\u6765\u589e\u5f3a\u5bf9\u591a\u6a21\u6001\u6587\u6863\u7684\u7406\u89e3\uff0c\u786e\u4fdd\u56fe\u50cf\u3001\u8868\u683c\u7b49\u975e\u6587\u672c\u5185\u5bb9\u88ab\u8f6c\u5316\u4e3a <strong>LLM-ready<\/strong> \u7684\u6570\u636e \u6216\u6574\u5408\u4e3a\u4e0a\u4e0b\u6587\u4ee5\u63d0\u4f9b\u66f4\u6df1\u5165\u7684\u6d1e\u5bdf\u3002\u7136\u800c\uff0c\u4e24\u8005\u5728\u67b6\u6784\u3001\u76ee\u7684\u548c VLM \u5b9e\u65bd\u91cd\u70b9\u4e0a\u5b58\u5728\u663e\u8457\u5dee\u5f02\u3002<\/p>\n\n\n\n<figure class=\"wp-block-gallery has-nested-images columns-default is-cropped wp-block-gallery-1 is-layout-flex wp-block-gallery-is-layout-flex\">\n<figure class=\"wp-block-image size-large\"><img loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"480\" data-id=\"6400\" src=\"https:\/\/nullthought.net\/wp-content\/uploads\/2025\/10\/RAG-Anything.jpg\" alt=\"\" class=\"wp-image-6400\" srcset=\"https:\/\/nullthought.net\/wp-content\/uploads\/2025\/10\/RAG-Anything.jpg 1024w, https:\/\/nullthought.net\/wp-content\/uploads\/2025\/10\/RAG-Anything-300x141.jpg 300w, https:\/\/nullthought.net\/wp-content\/uploads\/2025\/10\/RAG-Anything-768x360.jpg 768w\" sizes=\"auto, (max-width: 1024px) 100vw, 1024px\" \/><\/figure>\n\n\n\n<figure class=\"wp-block-image size-large\"><img loading=\"lazy\" decoding=\"async\" width=\"1024\" height=\"476\" data-id=\"6401\" src=\"https:\/\/nullthought.net\/wp-content\/uploads\/2025\/10\/reducto.jpg\" alt=\"\" class=\"wp-image-6401\" srcset=\"https:\/\/nullthought.net\/wp-content\/uploads\/2025\/10\/reducto.jpg 1024w, https:\/\/nullthought.net\/wp-content\/uploads\/2025\/10\/reducto-300x139.jpg 300w, https:\/\/nullthought.net\/wp-content\/uploads\/2025\/10\/reducto-768x357.jpg 768w\" sizes=\"auto, (max-width: 1024px) 100vw, 1024px\" \/><\/figure>\n<figcaption class=\"blocks-gallery-caption wp-element-caption\">Reducto \u4e0e RAG-Anything \u7684\u6bd4\u8f83\uff08\u56fe\u7247\u7531NotebookLM\u751f\u6210\uff09<\/figcaption><\/figure>\n\n\n\n<h3 class=\"wp-block-heading\">1. \u67b6\u6784\u7126\u70b9\u4e0e\u7cfb\u7edf\u6027\u8d28<\/h3>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><tbody><tr><th>\u7279\u6027 (Feature)<\/th><th>Reducto<\/th><th>RAG-Anything<\/th><\/tr><tr><td><strong>\u6027\u8d28 (Nature)<\/strong><\/td><td><strong>\u5546\u4e1a\u4ea7\u54c1\/\u670d\u52a1<\/strong>\uff0c\u88ab\u63cf\u8ff0\u4e3a\u201cAI \u6587\u6863\u89e3\u6790\u548c\u63d0\u53d6\u8f6f\u4ef6\u201d\uff0c\u901a\u8fc7\u7075\u6d3b\u7684 API \u63d0\u4f9b\uff0c\u9762\u5411\u751f\u4ea7\u73af\u5883\u7684 AI\u3002<\/td><td><strong>\u5f00\u6e90 RAG \u6846\u67b6<\/strong>\uff0c\u662f\u5efa\u7acb\u5728 LightRAG \u4e4b\u4e0a\u7684\u201c<strong>\u4e00\u4f53\u5316\u591a\u6a21\u6001\u6587\u6863\u5904\u7406 RAG \u7cfb\u7edf<\/strong>\u201d\u3002<\/td><\/tr><tr><td><strong>\u6838\u5fc3\u6d41\u7a0b (Core Pipeline)<\/strong><\/td><td>\u4f7f\u7528\u591a\u7a0b\uff08multi-pass\uff09\u7cfb\u7edf\uff1a\u9996\u5148\u662f<strong>\u4f20\u7edf\u8ba1\u7b97\u673a\u89c6\u89c9<\/strong>\uff08CV\uff09\u8fdb\u884c\u6587\u6863\u5206\u89e3\uff0c\u7136\u540e\u662f VLM \u89e3\u91ca\uff0c\u4ee5\u53ca VLM\/Agentic \u6a21\u578b\u8fdb\u884c\u6821\u6b63\u3002<\/td><td>\u5b9e\u65bd<strong>\u591a\u9636\u6bb5\u591a\u6a21\u6001\u6d41\u6c34\u7ebf<\/strong>\uff1a\u6587\u6863\u89e3\u6790 \u2192 \u5185\u5bb9\u5206\u6790 \u2192 \u77e5\u8bc6\u56fe\u8c31 \u2192 \u667a\u80fd\u68c0\u7d22\u3002<\/td><\/tr><tr><td><strong>\u4f01\u4e1a\u5c31\u7eea\u6027 (Enterprise Readiness)<\/strong><\/td><td>\u4e13\u4e3a\u751f\u4ea7 AI \u800c\u8bbe\u8ba1\uff0c\u83b7\u5f97\u8d22\u5bcc 10 \u5f3a\u4f01\u4e1a\u7684\u4fe1\u4efb\uff0c\u5177\u5907 <strong>99.9%+ \u8fd0\u884c\u65f6\u95f4<\/strong>\u3001\u4f01\u4e1a\u7ea7\u652f\u6301\u3001\u4ee5\u53ca <strong>SOC2 \u548c HIPAA \u5408\u89c4<\/strong>\u8ba4\u8bc1\u3002\u53ef\u5b8c\u5168\u90e8\u7f72\u5728\u7528\u6237\u81ea\u5df1\u7684\u57fa\u7840\u8bbe\u65bd\u5185\u3002<\/td><td>\u4e13\u6ce8\u4e8e\u63d0\u4f9b\u7075\u6d3b\u7684 RAG \u6846\u67b6\u3002\u8981\u6c42\u7528\u6237\u81ea\u884c\u914d\u7f6e\u4f9d\u8d56\u9879\uff08\u4f8b\u5982\uff0c\u5904\u7406 Office \u6587\u6863\u9700\u8981 <strong>LibreOffice<\/strong>\uff09\u548c\u5916\u90e8\u6a21\u578b\uff08\u4f8b\u5982\uff0c\u9700\u8981\u914d\u7f6e <code>vision_model_func<\/code> \u4ee5\u4f7f\u7528 <strong>GPT-4o<\/strong> \u7b49 VLM\uff09\u3002<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<h3 class=\"wp-block-heading\">2. VLM \u5229\u7528\u4e0e\u591a\u6a21\u6001\u5904\u7406<\/h3>\n\n\n\n<h4 class=\"wp-block-heading\">Reducto \u7684 VLM \u65b9\u6cd5\uff1a\u6821\u6b63\u4e0e\u89e3\u91ca<\/h4>\n\n\n\n<p>Reducto \u7684\u7cfb\u7edf\u4e3b\u8981\u5728\u6587\u6863\u63d0\u53d6\u7684<strong>\u5185\u5bb9\u5206\u6790\u548c\u7ec6\u5316<\/strong>\u9636\u6bb5\u4f7f\u7528 VLM\u3002<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li><strong>\u5e03\u5c40\u5206\u5272\uff08CV \u4f18\u5148\uff09\uff1a<\/strong> \u4f20\u7edf\u8ba1\u7b97\u673a\u89c6\u89c9\u6a21\u578b\u9996\u5148\u4ece\u89c6\u89c9\u4e0a\u5206\u89e3\u6587\u6863\uff0c\u6355\u83b7\u533a\u57df\u3001\u8868\u683c\u3001\u56fe\u5f62\u548c\u6587\u672c\u3002<\/li>\n\n\n\n<li><strong>\u4e0a\u4e0b\u6587\u89e3\u91ca\uff08VLM\uff09\uff1a<\/strong> VLM \u968f\u540e\u5728<strong>\u4e0a\u4e0b\u6587<\/strong>\u4e2d\u89e3\u91ca\u6bcf\u4e2a\u8bc6\u522b\u51fa\u7684\u533a\u57df\uff0c\u8fdb\u884c\u8bf8\u5982\u5c06\u6807\u7b7e\u94fe\u63a5\u5230\u6570\u503c\u3001\u7406\u89e3\u8868\u683c\u548c\u5206\u7c7b\u6bb5\u843d\u7684\u4efb\u52a1\u3002<\/li>\n\n\n\n<li><strong>\u51c6\u786e\u6027\u589e\u5f3a\uff08Agentic \u6a21\u578b\/VLM\uff09\uff1a<\/strong> Reducto \u5177\u6709\u4e00\u4e2a<strong>Agentic \u6a21\u578b<\/strong>\uff0c\u5b83\u80fd\u68c0\u6d4b\u5e76\u7ea0\u6b63\u7ec6\u5fae\u9519\u8bef\uff0c\u201c\u50cf\u4eba\u7c7b\u7f16\u8f91\u4e00\u6837\u201d\u5de5\u4f5c\uff0c\u786e\u4fdd\u5728\u6700\u8be6\u7ec6\u7684\u6848\u4f8b\u4e2d\u4e5f\u80fd\u4fdd\u8bc1\u51c6\u786e\u6027\u3002Reducto \u7684\u76ee\u6807\u662f\u4ea7\u751f<strong>\u6700\u51c6\u786e\u3001LLM-ready \u7684\u7ed3\u679c<\/strong>\u3002<\/li>\n<\/ol>\n\n\n\n<h4 class=\"wp-block-heading\">RAG-Anything \u7684 VLM \u65b9\u6cd5\uff1a\u67e5\u8be2\u548c\u5173\u7cfb\u5efa\u6a21<\/h4>\n\n\n\n<p>RAG-Anything \u5728\u5185\u5bb9\u5904\u7406\u9636\u6bb5\u548c\u68c0\u7d22\u67e5\u8be2\u9636\u6bb5\u90fd\u4f7f\u7528\u4e86 VLM\uff1a<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li><strong>\u5185\u5bb9\u5206\u6790\u5668\uff08Visual Content Analyzer\uff09\uff1a<\/strong> \u4e13\u7528\u7684<strong>\u89c6\u89c9\u5185\u5bb9\u5206\u6790\u5668<\/strong>\u96c6\u6210\u4e86\u89c6\u89c9\u6a21\u578b\uff0c\u6839\u636e\u89c6\u89c9\u8bed\u4e49\u751f\u6210<strong>\u4e0a\u4e0b\u6587\u611f\u77e5<\/strong>\u7684\u63cf\u8ff0\u6027\u8bf4\u660e\u6587\u5b57\uff08captions\uff09\u3002<\/li>\n\n\n\n<li><strong>\u589e\u5f3a\u67e5\u8be2\uff08VLM-Enhanced Query Mode\uff09\uff1a<\/strong> RAG-Anything \u73b0\u5df2\u63a8\u51fa <strong>VLM \u589e\u5f3a\u67e5\u8be2<\/strong>\u6a21\u5f0f\u3002\u5f53\u67e5\u8be2\u5305\u542b\u56fe\u50cf\u7684\u6587\u6863\u65f6\uff0c\u7cfb\u7edf\u4f1a\u81ea\u52a8\uff1a\n<ul class=\"wp-block-list\">\n<li>\u68c0\u7d22\u5305\u542b\u56fe\u50cf\u8def\u5f84\u7684\u76f8\u5173\u4e0a\u4e0b\u6587\u3002<\/li>\n\n\n\n<li>\u52a0\u8f7d\u5e76\u5c06\u56fe\u50cf\u7f16\u7801\u4e3a Base64 \u683c\u5f0f\u3002<\/li>\n\n\n\n<li>\u5c06\u6587\u672c\u4e0a\u4e0b\u6587\u548c\u56fe\u50cf\u4e00\u8d77\u53d1\u9001\u7ed9 VLM (\u4f8b\u5982\uff0c\u914d\u7f6e\u4e3a <strong>GPT-4o<\/strong>)\uff0c\u8fdb\u884c<strong>\u7efc\u5408\u591a\u6a21\u6001\u5206\u6790<\/strong>\uff0c\u4ece\u800c\u7ed3\u5408\u89c6\u89c9\u548c\u6587\u672c\u4e0a\u4e0b\u6587\u4ee5\u83b7\u5f97\u66f4\u6df1\u5165\u7684\u89c1\u89e3\u3002\u7528\u6237\u53ef\u4ee5\u624b\u52a8\u6216\u81ea\u52a8\u63a7\u5236\u6b64 VLM \u589e\u5f3a\u529f\u80fd\u3002<\/li>\n<\/ul>\n<\/li>\n\n\n\n<li><strong>\u591a\u6a21\u6001\u77e5\u8bc6\u56fe\u8c31\uff1a<\/strong> RAG-Anything \u901a\u8fc7<strong>\u591a\u6a21\u6001\u77e5\u8bc6\u56fe\u8c31\u7d22\u5f15<\/strong>\u5c06\u6587\u6863\u5185\u5bb9\u8f6c\u5316\u4e3a\u7ed3\u6784\u5316\u8bed\u4e49\u8868\u793a\u3002\u8be5\u8fc7\u7a0b\u6d89\u53ca<strong>\u8de8\u6a21\u6001\u5173\u7cfb\u6620\u5c04<\/strong>\uff0c\u4ee5\u5efa\u7acb\u6587\u672c\u5b9e\u4f53\u4e0e\u591a\u6a21\u6001\u7ec4\u4ef6\u4e4b\u95f4\u7684\u8bed\u4e49\u8fde\u63a5\u548c\u4f9d\u8d56\u5173\u7cfb\u3002<\/li>\n<\/ol>\n\n\n\n<h3 class=\"wp-block-heading\">3. \u8f93\u51fa\u7ed3\u6784\u4e0e\u5185\u5bb9\u8303\u56f4<\/h3>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><tbody><tr><th>\u7279\u6027 (Feature)<\/th><th>Reducto<\/th><th>RAG-Anything<\/th><\/tr><tr><td><strong>\u6570\u636e\u7ed3\u6784\u5316<\/strong><\/td><td>\u4e13\u6ce8\u4e8e <strong>LLM \u4f18\u5316<\/strong>\uff0c\u5305\u62ec<strong>\u667a\u80fd\u5206\u5757<\/strong> (Intelligent chunking)\u3001<strong>\u56fe\u8868\u603b\u7ed3<\/strong> (Figure summarization)\u3001<strong>\u56fe\u8868\u63d0\u53d6<\/strong> (Graph extraction) \u548c<strong>\u5d4c\u5165\u4f18\u5316<\/strong> (Embedding optimization)\u3002<\/td><td>\u4e13\u6ce8\u4e8e<strong>\u591a\u6a21\u6001\u77e5\u8bc6\u56fe\u8c31<\/strong>\uff0c\u901a\u8fc7<strong>\u591a\u6a21\u6001\u5b9e\u4f53\u63d0\u53d6<\/strong>\u548c<strong>\u8de8\u6a21\u6001\u5173\u7cfb\u6620\u5c04<\/strong>\u6765\u7ef4\u62a4\u5185\u5bb9\u95f4\u7684\u8bed\u4e49\u548c\u7ed3\u6784\u5173\u7cfb\u3002<\/td><\/tr><tr><td><strong>\u652f\u6301\u5185\u5bb9<\/strong><\/td><td>\u652f\u6301 <strong>PDFs<\/strong>\u3001<strong>\u56fe\u50cf<\/strong>\u3001<strong>\u7535\u5b50\u8868\u683c<\/strong>\u3001<strong>\u5e7b\u706f\u7247<\/strong>\u7b49\u6587\u4ef6\u7c7b\u578b\u3002\u53ef\u5904\u7406\u590d\u6742\u7684\u6587\u6863\uff0c\u5982\u6295\u8d44\u8005\u8d44\u6599\u3001SEC \u6587\u4ef6\u3001\u590d\u6742\u7684\u8868\u683c\u3001\u56fe\u8868\u548c\u8d22\u52a1\u62a5\u8868\u3002<\/td><td>\u652f\u6301 <strong>PDFs<\/strong>\u3001<strong>Office \u6587\u6863<\/strong>\uff08DOC\/DOCX\/PPT\/PPTX\/XLS\/XLSX\uff09\u3001<strong>\u56fe\u50cf<\/strong>\u548c<strong>\u6587\u672c\u6587\u4ef6<\/strong>\uff08TXT\/MD\uff09\u3002\u5177\u6709\u9488\u5bf9<strong>\u56fe\u50cf<\/strong>\u3001<strong>\u8868\u683c<\/strong>\u548c<strong>\u6570\u5b66\u516c\u5f0f<\/strong>\uff08\u652f\u6301<strong>\u539f\u751f LaTeX \u683c\u5f0f<\/strong>\uff09\u7684\u4e13\u7528\u5185\u5bb9\u5904\u7406\u5668\u3002<\/td><\/tr><tr><td><strong>\u8bed\u8a00\u652f\u6301<\/strong><\/td><td>\u63d0\u4f9b\u8d85\u8fc7 <strong>100 \u79cd\u8bed\u8a00<\/strong>\u7684\u591a\u8bed\u8a00\u89e3\u6790\u3002<\/td><td>\uff08\u6765\u6e90\u672a\u660e\u786e\u63d0\u53ca\u5e7f\u6cdb\u7684\u591a\u8bed\u8a00\u652f\u6301\u8303\u56f4\uff0c\u4f46 MinerU \u89e3\u6790\u5668\u652f\u6301\u8bbe\u7f6e <code>lang<\/code> \u53c2\u6570\u8fdb\u884c OCR \u4f18\u5316\uff0c\u4f8b\u5982\u201cch\u201d\u6216\u201cja\u201d\u3002\uff09<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<h2 class=\"wp-block-heading\">\u8be6\u7ec6\u5206\u6790<\/h2>\n\n\n\n<p><strong>Reducto \u7684\u4f18\u52bf\uff1a\u51c6\u786e\u6027\u548c\u751f\u4ea7\u5c31\u7eea\u6027<\/strong><\/p>\n\n\n\n<p>Reducto \u9488\u5bf9\u9700\u8981\u6781\u9ad8\u51c6\u786e\u6027\u7684\u9ad8\u4ef7\u503c\u3001\u9ad8\u541e\u5410\u91cf\u7684\u751f\u4ea7\u73af\u5883\uff08\u5982<strong>\u91d1\u878d\u3001\u533b\u7597\u3001\u6cd5\u5f8b<\/strong>\uff09\u8fdb\u884c\u4e86\u4f18\u5316\u3002\u5176\u8bbe\u8ba1\u6d41\u7a0b\u2014\u2014\u5148\u8fdb\u884c CV \u89e3\u6790\uff0c\u518d\u8fdb\u884c VLM \u89e3\u91ca\u548c Agentic \u6a21\u578b\u6821\u6b63\u2014\u2014\u8868\u660e\u5b83\u662f\u4e00\u4e2a\u65e8\u5728\u6700\u5927\u9650\u5ea6\u51cf\u5c11\u63d0\u53d6\u9519\u8bef\u7684\u5f3a\u5927\u7cfb\u7edf\u3002\u5b83\u660e\u786e\u5f3a\u8c03\u4f01\u4e1a\u7ea7\u529f\u80fd\uff0c\u5982\u5b89\u5168\u5408\u89c4\u6027 (<strong>SOC2, HIPAA<\/strong>) \u548c\u7075\u6d3b\u7684\u90e8\u7f72\u9009\u9879\uff08\u53ef\u5728\u7528\u6237\u81ea\u5df1\u7684\u57fa\u7840\u8bbe\u65bd\u4e2d\u8fd0\u884c\uff09\uff0c\u4f7f\u5176\u6210\u4e3a\u5bfb\u6c42\u53ef\u9760 API \u670d\u52a1\u7684\u6210\u719f\u7ec4\u7ec7\u7684\u9996\u9009\u3002<\/p>\n\n\n\n<p><strong>RAG-Anything \u7684\u4f18\u52bf\uff1a\u8bed\u4e49\u6df1\u5ea6\u548c\u7075\u6d3b\u6027<\/strong><\/p>\n\n\n\n<p>RAG-Anything \u7684\u6838\u5fc3\u4f18\u52bf\u5728\u4e8e\u5176 <strong>All-in-One<\/strong> RAG \u6846\u67b6\u65b9\u6cd5 \u548c\u5148\u8fdb\u7684<strong>\u8bed\u4e49\u7ed3\u6784\u5316<\/strong>\u80fd\u529b\u3002\u901a\u8fc7\u6784\u5efa<strong>\u591a\u6a21\u6001\u77e5\u8bc6\u56fe\u8c31<\/strong>\uff0c\u5b83\u8d85\u8d8a\u4e86\u7b80\u5355\u7684\u5206\u5757\u6216\u603b\u7ed3\uff0c\u660e\u786e\u5730\u5bf9\u4e0d\u540c\u6a21\u6001\uff08\u6587\u672c\u3001\u56fe\u50cf\u3001\u8868\u683c\u3001\u516c\u5f0f\uff09\u4e4b\u95f4\u7684\u5173\u7cfb\u8fdb\u884c\u5efa\u6a21\u3002\u8fd9\u79cd\u5173\u7cfb\u4e00\u81f4\u6027\u5728\u68c0\u7d22\u8fc7\u7a0b\u4e2d\u5f97\u4ee5\u4fdd\u6301\uff0c\u786e\u4fdd\u4fe1\u606f\u4f20\u9012\u662f\u4e0a\u4e0b\u6587\u6574\u5408\u7684\u3002\u6b64\u5916\uff0c<strong>VLM \u589e\u5f3a\u67e5\u8be2\u6a21\u5f0f<\/strong> \u5141\u8bb8\u5728\u67e5\u8be2\u9636\u6bb5\u5bf9\u68c0\u7d22\u5230\u7684\u89c6\u89c9\u5185\u5bb9\u8fdb\u884c\u52a8\u6001\u3001\u5b9e\u65f6\u7684 VLM \u5206\u6790\uff0c\u8fd9\u5bf9\u4e8e\u9700\u8981 VLM \u5728\u4e0a\u4e0b\u6587\u4e2d\u5bf9\u56fe\u8868\u8fdb\u884c\u5373\u65f6\u89e3\u91ca\u7684\u7528\u4f8b\u975e\u5e38\u6709\u7528\u3002\u5b83\u8fd8\u652f\u6301\u76f4\u63a5\u63d2\u5165\u9884\u89e3\u6790\u7684\u5185\u5bb9\u5217\u8868\uff0c\u63d0\u4f9b\u4e86\u9ad8\u5ea6\u7684\u7075\u6d3b\u6027\u548c\u53ef\u5b9a\u5236\u6027\u3002<\/p>\n\n\n\n<h2 class=\"wp-block-heading\">\u5e94\u7528\u5efa\u8bae<\/h2>\n\n\n\n<p>\u9009\u62e9 Reducto \u8fd8\u662f RAG-Anything \u4e3b\u8981\u53d6\u51b3\u4e8e\u7528\u6237\u7684\u64cd\u4f5c\u73af\u5883\u3001\u6280\u672f\u8981\u6c42\u548c\u6700\u7ec8\u76ee\u6807\uff1a<\/p>\n\n\n\n<h3 class=\"wp-block-heading\">Reducto \u63a8\u8350\u573a\u666f<\/h3>\n\n\n\n<p>\u5982\u679c\u7528\u6237\u9700\u8981\u6ee1\u8db3\u4ee5\u4e0b\u6761\u4ef6\uff0c\u5219\u63a8\u8350\u4f7f\u7528 Reducto\uff1a<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li><strong>\u6781\u9ad8\u7684\u63d0\u53d6\u51c6\u786e\u6027\uff1a<\/strong> \u4e3b\u8981\u76ee\u6807\u662f\u4ece\u590d\u6742\u6587\u6863\uff08\u5982\u8d22\u52a1\u62a5\u544a\u6216\u6cd5\u5f8b\u6587\u4ef6\uff09\u4e2d\u63d0\u53d6\u9ad8\u5ea6\u53ef\u9760\u7684\u7ed3\u6784\u5316\u6570\u636e\uff0c\u5176\u4e2d\u5fae\u5c0f\u7684\u89e3\u6790\u9519\u8bef\u4ee3\u4ef7\u9ad8\u6602\u3002<\/li>\n\n\n\n<li><strong>\u4f01\u4e1a\u7ea7\u751f\u4ea7\u8981\u6c42\uff1a<\/strong> \u5e94\u7528\u9700\u8981\u9ad8\u53ef\u7528\u6027 (<strong>99.9%+ uptime<\/strong>)\u3001\u4e25\u683c\u7684\u5b89\u5168\u5408\u89c4\u6027 (<strong>HIPAA, SOC2<\/strong>)\uff0c\u6216\u9700\u8981\u5728\u79c1\u6709\u73af\u5883\u4e2d\u90e8\u7f72\u3002<\/li>\n\n\n\n<li><strong>\u504f\u597d API \u96c6\u6210\uff1a<\/strong> \u7528\u6237\u503e\u5411\u4e8e\u96c6\u6210\u4e00\u4e2a\u7ecf\u8fc7\u7ba1\u7406\u3001\u5177\u5907\u670d\u52a1\u6c34\u5e73\u534f\u8bae (SLAs) \u7684\u5546\u4e1a API \u670d\u52a1\uff0c\u800c\u4e0d\u662f\u7ef4\u62a4\u4e00\u4e2a\u590d\u6742\u7684\u5f00\u6e90\u6846\u67b6\u53ca\u5176\u4f9d\u8d56\u9879\u3002<\/li>\n<\/ol>\n\n\n\n<h3 class=\"wp-block-heading\">RAG-Anything \u63a8\u8350\u573a\u666f<\/h3>\n\n\n\n<p>\u5982\u679c\u7528\u6237\u9700\u8981\u6ee1\u8db3\u4ee5\u4e0b\u6761\u4ef6\uff0c\u5219\u63a8\u8350\u4f7f\u7528 RAG-Anything\uff1a<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li><strong>\u6df1\u5ea6\u7684\u5173\u7cfb\u7406\u89e3\uff1a<\/strong> \u5e94\u7528\u7a0b\u5e8f\u4f9d\u8d56\u4e8e\u7406\u89e3\u591a\u6a21\u6001\u7ec4\u4ef6\u4e4b\u95f4\u7684\u8bed\u4e49\u5173\u7cfb\u548c\u5c42\u6b21\u7ed3\u6784\uff0c\u4f8b\u5982\u5728\u5b66\u672f\u7814\u7a76\u6216\u6280\u672f\u6587\u6863\u4e2d\uff0c\u4e0a\u4e0b\u6587\u81f3\u5173\u91cd\u8981\u3002<strong>\u591a\u6a21\u6001\u77e5\u8bc6\u56fe\u8c31<\/strong>\u80fd\u529b \u5728\u6b64\u7279\u522b\u9002\u7528\u3002<\/li>\n\n\n\n<li><strong>\u9ad8\u5ea6\u5b9a\u5236\u548c\u63a7\u5236\uff1a<\/strong> \u7528\u6237\u9700\u8981\u5bf9\u5904\u7406\u6d41\u7a0b\u3001\u89e3\u6790\u5668\uff08MinerU\/Docling\uff09 \u548c\u68c0\u7d22\u673a\u5236\u8fdb\u884c\u7cbe\u7ec6\u63a7\u5236\uff0c\u5e76\u53ef\u80fd\u5e0c\u671b\u5b9e\u65bd<strong>\u81ea\u5b9a\u4e49\u6a21\u6001\u5904\u7406\u5668<\/strong>\u3002<\/li>\n\n\n\n<li><strong>\u52a8\u6001 VLM \u67e5\u8be2\u5206\u6790\uff1a<\/strong> \u5bf9\u4e8e\u67e5\u8be2\u7ed3\u679c\u53d7\u76ca\u4e8e<strong>\u68c0\u7d22\u65f6\u5bf9\u89c6\u89c9\u7ec4\u4ef6\u8fdb\u884c\u5b9e\u65f6 VLM \u5206\u6790<\/strong>\u7684\u7528\u4f8b\uff0c\u4f8b\u5982\u8981\u6c42 LLM \u6839\u636e\u68c0\u7d22\u5230\u7684\u7279\u5b9a\u56fe\u50cf\u6765\u201c\u5206\u6790\u6587\u6863\u4e2d\u7684\u56fe\u8868\u548c\u6570\u5b57\u201d\u3002<\/li>\n\n\n\n<li><strong>\u5904\u7406\u590d\u6742\u7684\u6570\u5b66\u5185\u5bb9\uff1a<\/strong> \u6587\u6863\u4e2d\u7ecf\u5e38\u5305\u542b\u590d\u6742\u7684\u6570\u5b66\u8868\u8fbe\u5f0f\u548c\u516c\u5f0f\uff0c\u9700\u8981<strong>\u539f\u751f LaTeX \u683c\u5f0f\u89e3\u6790<\/strong>\u548c\u6982\u5ff5\u6620\u5c04\u3002<\/li>\n<\/ol>\n\n\n\n<hr class=\"wp-block-separator has-alpha-channel-opacity\"\/>\n\n\n\n<h2 class=\"wp-block-heading\">Comparison and Analysis of Reducto and RAG-Anything<\/h2>\n\n\n\n<p>Both Reducto and RAG-Anything leverage Vision-Language Models (VLMs) to enhance the understanding of multimodal documents, ensuring that non-textual content like images and tables are converted into <strong>LLM-ready<\/strong> data or integrated contextually for deeper insights. However, they differ significantly in their architecture, purpose, and VLM implementation focus.<\/p>\n\n\n\n<h3 class=\"wp-block-heading\">1. Architectural Focus and System Nature<\/h3>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><tbody><tr><th>Feature<\/th><th>Reducto<\/th><th>RAG-Anything<\/th><\/tr><tr><td><strong>Nature<\/strong><\/td><td>Commercial product\/service, characterized as an &#8220;AI document parsing &amp; extraction software&#8221; offered via flexible APIs.<\/td><td>Open-source RAG framework, described as a &#8220;comprehensive <strong>All-in-One Multimodal Document Processing RAG system<\/strong>&#8221; built on LightRAG.<\/td><\/tr><tr><td><strong>Core Pipeline<\/strong><\/td><td>Uses a multi-pass system starting with <strong>Traditional Computer Vision<\/strong> (layout-aware models) for document breakdown, followed by VLM interpretation and VLM\/Agentic model corrections.<\/td><td>Implements a <strong>multi-stage multimodal pipeline<\/strong> (Document Parsing \u2192  Content Analysis \u2192  Knowledge Graph \u2192  Intelligent Retrieval).<\/td><\/tr><tr><td><strong>Enterprise Readiness<\/strong><\/td><td>Built for production AI, trusted by Fortune 10 enterprises, with 99.9%+ uptime, Enterprise support, and certifications (SOC2, HIPAA compliant). Can be deployed entirely within the user&#8217;s infrastructure.<\/td><td>Focuses on providing a flexible, integrated RAG framework. Requires user setup for dependencies (e.g., LibreOffice for Office documents) and external models (e.g., OpenAI&#8217;s GPT-4o for VLM functions).<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<h3 class=\"wp-block-heading\">2. VLM Utilization and Multimodal Processing<\/h3>\n\n\n\n<p>Both platforms use VLMs to bridge the gap between visual information and textual context, but they deploy them at different stages or for different primary goals:<\/p>\n\n\n\n<h4 class=\"wp-block-heading\">Reducto&#8217;s VLM Approach (Correction and Interpretation)<\/h4>\n\n\n\n<p>Reducto&#8217;s system uses VLMs primarily during the <em>content analysis and refinement<\/em> phases of document extraction.<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li><strong>Layout Segmentation (CV First):<\/strong> Traditional computer vision models first break down the document visually, identifying regions, tables, figures, and text.<\/li>\n\n\n\n<li><strong>Contextual Interpretation (VLM):<\/strong> VLMs then interpret each identified region <strong>in context<\/strong>. This is critical for tasks like linking labels to values, understanding complex tables, and classifying segments.<\/li>\n\n\n\n<li><strong>Accuracy Enhancement (Agentic Model\/VLM):<\/strong> Reducto features an <strong>Agentic model<\/strong>\u2014which performs like a human editor\u2014to detect minor mistakes and correct them, ensuring accuracy even in detailed cases. Reducto aims to produce the <strong>most accurate, LLM-ready results<\/strong>.<\/li>\n<\/ol>\n\n\n\n<h4 class=\"wp-block-heading\">RAG-Anything&#8217;s VLM Approach (Generation and Retrieval)<\/h4>\n\n\n\n<p>RAG-Anything utilizes VLMs both during the initial content processing stage and, notably, during the query stage:<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li><strong>Processing (Visual Content Analyzer):<\/strong> A dedicated <strong>Visual Content Analyzer<\/strong> integrates vision models to generate context-aware descriptive captions based on visual semantics. It also extracts spatial relationships and hierarchical structures between visual elements.<\/li>\n\n\n\n<li><strong>Querying (VLM-Enhanced Query Mode):<\/strong> RAG-Anything now features a <strong>VLM-Enhanced Query<\/strong> mode. When documents containing images are queried, the system automatically:\n<ul class=\"wp-block-list\">\n<li>Retrieves relevant context containing image paths.<\/li>\n\n\n\n<li>Loads and encodes the images as base64.<\/li>\n\n\n\n<li>Sends both the text context and the images directly to the VLM (e.g., GPT-4o) for comprehensive analysis <em>during retrieval\/answering<\/em>. This allows the VLM to combine visual and textual context for deeper insights. This mode can be automatically or manually enabled\/disabled.<\/li>\n<\/ul>\n<\/li>\n\n\n\n<li><strong>Multimodal Querying:<\/strong> RAG-Anything also supports specific <strong>Multimodal Queries<\/strong> where the user provides specific content (like table data or a LaTeX formula) alongside the query for enhanced analysis. <\/li>\n<\/ol>\n\n\n\n<h3 class=\"wp-block-heading\">3. Output Structure and Content Scope<\/h3>\n\n\n\n<p>Both systems aim to structure data for LLMs, but RAG-Anything places a heavy emphasis on relationship mapping:<\/p>\n\n\n\n<h4 class=\"wp-block-heading\">Data Structuring<\/h4>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>Reducto:<\/strong> Focuses on extracting data into LLM-optimized formats, including <strong>intelligent chunking<\/strong>, <strong>figure summarization<\/strong>, <strong>graph extraction<\/strong>, and <strong>embedding optimization<\/strong>. The goal is to transform unstructured documents into structured, reliable data.<\/li>\n\n\n\n<li><strong>RAG-Anything:<\/strong> Transforms document content into structured semantic representations via a <strong>Multimodal Knowledge Graph Index<\/strong>. This process involves <strong>Multi-Modal Entity Extraction<\/strong> (with semantic annotations) and crucial <strong>Cross-Modal Relationship Mapping<\/strong> (establishing dependencies between textual entities and multimodal components). This framework uses hybrid retrieval combining vector search and graph traversal algorithms.<\/li>\n<\/ul>\n\n\n\n<h4 class=\"wp-block-heading\">Supported Content Types<\/h4>\n\n\n\n<ul class=\"wp-block-list\">\n<li><strong>Reducto:<\/strong> Supports PDFs, images, spreadsheets, slides. It handles complex documents like investor decks, SEC filings, dense pitch materials, complex tables, charts, and financial statements. It offers multilingual parsing across <strong>100+ languages<\/strong>.<\/li>\n\n\n\n<li><strong>RAG-Anything:<\/strong> Provides dedicated processors for <strong>images<\/strong>, <strong>tables<\/strong>, and <strong>mathematical equations<\/strong> (supporting native LaTeX format). It supports a wide range of document formats (PDFs, Office Documents, Images, Text Files). It also features an <strong>Extensible Modality Handler<\/strong> for custom and emerging content types.<\/li>\n<\/ul>\n\n\n\n<h3 class=\"wp-block-heading\">Detailed Analysis<\/h3>\n\n\n\n<p><strong>Reducto&#8217;s Strength: Accuracy and Production Readiness<\/strong> Reducto appears optimized for high-stakes, high-volume production environments where extraction accuracy is paramount (e.g., finance, healthcare, legal). Its reliance on an initial CV pass followed by VLM interpretation and, critically, VLM-based <strong>Agentic correction<\/strong> suggests a robust system designed to minimize errors inherent in initial parsing. The explicit focus on enterprise features (SLAs, security compliance, deployment options) makes it suitable for large organizations seeking a reliable, ready-to-use API.<\/p>\n\n\n\n<p><strong>RAG-Anything&#8217;s Strength: Semantic Depth and Flexibility<\/strong> RAG-Anything\u2019s strength lies in its <strong>All-in-One<\/strong> RAG framework approach and its advanced semantic structuring. By constructing a <strong>Multimodal Knowledge Graph<\/strong>, it goes beyond simple chunking or summarization to explicitly model the relationships between different content modalities (text, images, tables, equations). This relational coherence is maintained during retrieval, ensuring contextually integrated information delivery. Furthermore, the innovative <strong>VLM-Enhanced Query<\/strong> mode allows for dynamic, real-time VLM analysis of retrieved images during the final query phase, enabling deeper insights based on the retrieved context. The system also offers flexibility through multiple parser options (MinerU, Docling) and the ability to insert pre-parsed content lists.<\/p>\n\n\n\n<h2 class=\"wp-block-heading\">Application Recommendations<\/h2>\n\n\n\n<p>The choice between Reducto and RAG-Anything depends heavily on the user&#8217;s operational context, technical requirements, and end goal:<\/p>\n\n\n\n<h3 class=\"wp-block-heading\">Recommendation for Reducto<\/h3>\n\n\n\n<p>Reducto is recommended when the user requires:<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li><strong>Maximum Extraction Accuracy:<\/strong> If the primary goal is highly reliable, structured data extraction from complex documents (like financial reports or legal filings) where even minor parsing errors are costly.<\/li>\n\n\n\n<li><strong>Enterprise Production Readiness:<\/strong> If the application requires high availability, dedicated enterprise support (SLAs), strict security compliance (HIPAA, SOC2), or deployment within a private environment.<\/li>\n\n\n\n<li><strong>API Integration Preference:<\/strong> If the user prefers integrating a streamlined, managed service via API rather than maintaining an open-source framework and its dependencies.<\/li>\n<\/ol>\n\n\n\n<h3 class=\"wp-block-heading\">Recommendation for RAG-Anything<\/h3>\n\n\n\n<p>RAG-Anything is recommended when the user requires:<\/p>\n\n\n\n<ol class=\"wp-block-list\">\n<li><strong>Deep Relational Understanding:<\/strong> If the application relies on understanding semantic relationships and hierarchical structure between multimodal components, such as in academic research or technical documentation where context is crucial. The <strong>Multimodal Knowledge Graph<\/strong> capability is ideal here.<\/li>\n\n\n\n<li><strong>Customization and Control:<\/strong> Since RAG-Anything is an open-source framework built on LightRAG, it is suitable for users who need fine-grained control over the processing pipeline, parsers (MinerU\/Docling), retrieval mechanisms, and who may want to implement custom modal processors.<\/li>\n\n\n\n<li><strong>Dynamic VLM Querying:<\/strong> For use cases where query results benefit from <strong>real-time VLM analysis<\/strong> of retrieved visual components, such as asking an LLM to &#8220;Analyze the charts and figures in the document&#8221; based on the specific images retrieved for the context.<\/li>\n\n\n\n<li><strong>Handling Mathematical Content:<\/strong> If documents frequently contain complex mathematical expressions and formulas that require native LaTeX format parsing and conceptual mapping.<\/li>\n<\/ol>\n","protected":false},"excerpt":{"rendered":"<p>Reducto \u548c RAG-Anything \u90fd\u5229\u7528\u89c6\u89c9-\u8bed\u8a00\u6a21\u578b\uff08VLM\uff09\u6765\u589e\u5f3a\u5bf9\u591a\u6a21\u6001\u6587\u6863\u7684\u7406\u89e3\uff0c\u786e\u4fdd\u56fe\u50cf [&hellip;]<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"site-sidebar-layout":"default","site-content-layout":"","ast-site-content-layout":"default","site-content-style":"default","site-sidebar-style":"default","ast-global-header-display":"","ast-banner-title-visibility":"","ast-main-header-display":"","ast-hfb-above-header-display":"","ast-hfb-below-header-display":"","ast-hfb-mobile-header-display":"","site-post-title":"","ast-breadcrumbs-content":"","ast-featured-img":"","footer-sml-layout":"","ast-disable-related-posts":"","theme-transparent-header-meta":"","adv-header-id-meta":"","stick-header-meta":"","header-above-stick-meta":"","header-main-stick-meta":"","header-below-stick-meta":"","astra-migrate-meta-layouts":"set","ast-page-background-enabled":"default","ast-page-background-meta":{"desktop":{"background-color":"","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"tablet":{"background-color":"","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"mobile":{"background-color":"","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""}},"ast-content-background-meta":{"desktop":{"background-color":"var(--ast-global-color-5)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"tablet":{"background-color":"var(--ast-global-color-5)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""},"mobile":{"background-color":"var(--ast-global-color-5)","background-image":"","background-repeat":"repeat","background-position":"center center","background-size":"auto","background-attachment":"scroll","background-type":"","background-media":"","overlay-type":"","overlay-color":"","overlay-opacity":"","overlay-gradient":""}},"footnotes":""},"categories":[3,8],"tags":[39,76,86,80],"class_list":["post-6399","post","type-post","status-publish","format-standard","hentry","category-it","category-tech","tag-ai","tag-rag","tag-llm","tag-cv"],"rttpg_featured_image_url":null,"rttpg_author":{"display_name":"NullThought","author_link":"https:\/\/nullthought.net\/?author=1"},"rttpg_comment":0,"rttpg_category":"<a href=\"https:\/\/nullthought.net\/?cat=3\" rel=\"category\">IT<\/a> <a href=\"https:\/\/nullthought.net\/?cat=8\" rel=\"category\">Tech<\/a>","rttpg_excerpt":"Reducto \u548c RAG-Anything \u90fd\u5229\u7528\u89c6\u89c9-\u8bed\u8a00\u6a21\u578b\uff08VLM\uff09\u6765\u589e\u5f3a\u5bf9\u591a\u6a21\u6001\u6587\u6863\u7684\u7406\u89e3\uff0c\u786e\u4fdd\u56fe\u50cf&hellip;","_links":{"self":[{"href":"https:\/\/nullthought.net\/index.php?rest_route=\/wp\/v2\/posts\/6399","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/nullthought.net\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/nullthought.net\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/nullthought.net\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/nullthought.net\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=6399"}],"version-history":[{"count":1,"href":"https:\/\/nullthought.net\/index.php?rest_route=\/wp\/v2\/posts\/6399\/revisions"}],"predecessor-version":[{"id":6402,"href":"https:\/\/nullthought.net\/index.php?rest_route=\/wp\/v2\/posts\/6399\/revisions\/6402"}],"wp:attachment":[{"href":"https:\/\/nullthought.net\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=6399"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/nullthought.net\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=6399"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/nullthought.net\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=6399"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}