
Commit 68f41bb

[update] add batch inference guide
1 parent c9efe99 commit 68f41bb

8 files changed: +270 −1 lines changed

docs/.vuepress/notes/en/guide.ts

Lines changed: 11 additions & 1 deletion
```diff
@@ -48,7 +48,17 @@ export const Guide: ThemeNote = defineNoteConfig({
       ],

     },
-
+    {
+      text: 'Preview Features',
+      collapsed: false,
+      icon: 'carbon:idea',
+      prefix: 'new_feature',
+      items: [
+        "resume",
+        "batch"
+      ],
+    },
+
     // {
     //   text: 'Dataflow Agent',
     //   collapsed: false,
```

docs/.vuepress/notes/zh/guide.ts

Lines changed: 10 additions & 0 deletions
```diff
@@ -55,6 +55,16 @@ export const Guide: ThemeNote = defineNoteConfig({
       'speech_transcription',
       ],
     },
+    {
+      text: '内测功能',
+      collapsed: false,
+      icon: 'carbon:idea',
+      prefix: 'new_feature',
+      items: [
+        "resume",
+        "batch"
+      ],
+    },

     {
       text:"流水线教程",
```
Lines changed: 107 additions & 0 deletions
---
title: Preview-Batched Inference
createTime: 2025/12/30 11:47:05
permalink: /en/guide/batch/
---

# Beta: Batched Inference

> This feature is currently in beta and may contain bugs. If you encounter any issues, please report them via an issue. Thank you for your understanding.
## Overview

During inference, if an operator holds a large amount of data (say, thousands of records) and an unexpected interruption occurs midway, the portion that has already been inferred is lost and the corresponding API calls are wasted.

To address this problem, we designed a **batched inference** interface with the following workflow (a minimal sketch of the idea follows the list):

1. Start inference for the first operator.
2. The operator processes only one batch at a time.
3. The output of the current step is appended to an appendable output step file (e.g., JSONL or CSV).
4. Once the entire dataset has been processed by the current operator, proceed to the next operator.
5. The entire pipeline is completed using this approach.
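To make the append-per-batch idea concrete, here is a minimal, self-contained sketch in plain Python. It is not DataFlow's implementation: `run_operator_batched`, `completed_count`, and the file layout are illustrative assumptions.

```python
import json
import os

def completed_count(step_file: str) -> int:
    """Number of records this step has already written (0 if no file yet)."""
    if not os.path.exists(step_file):
        return 0
    with open(step_file, "r", encoding="utf-8") as f:
        return sum(1 for _ in f)

def run_operator_batched(records, operator, step_file, batch_size=2):
    """Feed `records` to `operator` one batch at a time, appending each
    batch's output to an appendable JSONL step file so that work finished
    before a crash is never redone."""
    start = completed_count(step_file)  # resume: skip rows already on disk
    for i in range(start, len(records), batch_size):
        batch = records[i:i + batch_size]
        results = [operator(r) for r in batch]  # e.g., one API call per record
        with open(step_file, "a", encoding="utf-8") as f:
            for row in results:
                f.write(json.dumps(row, ensure_ascii=False) + "\n")
```

Because each batch is flushed to disk as soon as it finishes, an interruption costs at most one batch of API calls, and a rerun skips everything already written.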
## Usage

This works much like [Framework Design – Resume Pipelines](/en/guide/basicinfo/framework/#breakpoint-resume-pipelines-resume), except that the pipeline must inherit from a different base class, `BatchedPipelineABC`. It likewise needs to be compiled, and the `forward` function takes additional parameters. In addition, `Storage` currently needs to inherit from a special `BatchedFileStorage` class.
```python
from dataflow.pipeline import BatchedPipelineABC # [!code highlight]
from dataflow.operators.core_text import PromptedGenerator
from dataflow.serving import APILLMServing_request
from dataflow.utils.storage import BatchedFileStorage # [!code highlight]

class AutoOPPipeline(BatchedPipelineABC): # [!code highlight]

    def __init__(self):
        super().__init__()
        self.storage = BatchedFileStorage( # [!code highlight]
            first_entry_file_name="./dataflow/example/GeneralTextPipeline/pt_input.jsonl",
            cache_path="./cache_autoop",
            file_name_prefix="dataflow_cache_auto_run",
            cache_type="jsonl",
        )
        self.llm_serving = APILLMServing_request(
            api_url="https://api.openai.com/v1/chat/completions",
            model_name="gpt-4o",
            max_workers=30
        )
        self.op1 = PromptedGenerator(
            llm_serving=self.llm_serving,
            system_prompt="Please translate the following content into Chinese:",
        )
        self.op2 = PromptedGenerator(
            llm_serving=self.llm_serving,
            system_prompt="Please translate the following content into Korean:",
        )
        self.op3 = PromptedGenerator(
            llm_serving=self.llm_serving,
            system_prompt="Please translate the following content into Japanese:"
        )

    def forward(self):
        self.op1.run(
            self.storage.step(),
            input_key='raw_content',
            output_key='content_cn1'
        )
        self.op2.run(
            self.storage.step(),
            input_key='raw_content',
            output_key='content_cn2'
        )
        self.op3.run(
            self.storage.step(),
            input_key='raw_content',
            output_key='content_cn3'
        )

if __name__ == "__main__":
    pipeline = AutoOPPipeline()
    pipeline.compile() # [!code highlight]
    pipeline.forward(
        batch_size=2, # [!code highlight]
        resume_from_last=True
    )
```
`resume_from_last` allows the pipeline to automatically continue from the last step file found in the current cache path.

Alternatively, you can use `resume_step` to resume from a specific previous operator step. Note that **only one of these parameters can be set at a time** to avoid logical conflicts.
```python
# The following invocation is also valid
...
pipeline.compile()
pipeline.forward(
    batch_size=2,
    resume_step=2 # Resume from the operator with index 2; the first operator has index 0
)
```
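As a mental model for `resume_from_last` (the real lookup is internal to `BatchedFileStorage`; the naming pattern below is an assumption), you can picture it as scanning the cache path for the newest step file:

```python
import glob
import os

def latest_step_file(cache_path: str, prefix: str) -> str | None:
    """Hypothetical picture of resume_from_last: pick the most recently
    modified step file under the cache path (illustrative naming scheme)."""
    candidates = glob.glob(os.path.join(cache_path, f"{prefix}_step*.jsonl"))
    return max(candidates, key=os.path.getmtime) if candidates else None

# e.g., with the storage configured above:
print(latest_step_file("./cache_autoop", "dataflow_cache_auto_run"))
```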
---
Lines changed: 21 additions & 0 deletions
---
title: Preview-Checkpoint Resume
createTime: 2025/12/30 11:19:40
permalink: /en/guide/resume/
---

# Beta: Checkpoint Resume

> This feature is currently in beta and may contain bugs. If you encounter any issues, please report them via an issue. Thank you for your understanding.

## Overview

During inference, if the process is interrupted at a certain operator, the default workflow requires rerunning from an earlier operator: you comment out all preceding operators in the pipeline and manually rename an intermediate cached step file to serve as the new entry point, which is cumbersome and error-prone.

To address this, we provide a feature that allows inference to be resumed directly from a specific operator step. The sketch below illustrates the manual workaround this replaces.
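For contrast, the old manual workaround amounts to file surgery along these lines; every path and file name here is a made-up illustration, not DataFlow's actual cache layout:

```python
import shutil

# Illustrative only: what users previously did by hand before this feature.
# Suppose the pipeline died after operator 2; its cached step file survives.
last_step = "./cache/dataflow_cache_step_2.jsonl"   # hypothetical file name

# Promote that step file to be the pipeline's new entry file, then comment
# out the already-finished operators in forward() and point
# first_entry_file_name at the promoted file before rerunning.
shutil.copy(last_step, "./cache/new_entry.jsonl")
```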
## Usage

Please refer to [Framework Design – Resume Pipelines](/en/guide/basicinfo/framework/#breakpoint-resume-pipelines-resume) for details.
Lines changed: 98 additions & 0 deletions
---
title: "Preview: Batched Inference"
createTime: 2025/12/30 11:47:05
permalink: /zh/guide/batch/
---

# Beta: Batched Inference

> This feature is currently in beta and may contain bugs. If you find a problem, please report it promptly via an issue. Thanks for your understanding.
## Overview

During inference, if an operator holds a large amount of data, say several thousand records, and an unexpected interruption occurs midway, the already-inferred portion of those records is lost on the spot and the corresponding API calls are wasted.

To solve this problem, we designed a batched inference interface with the following workflow (a sketch of the driver loop follows the list):

1. Start inference for the first operator.
2. The operator is fed only one batch at a time.
3. The output of the current step is stored in an appendable output step file (e.g., JSONL or CSV).
4. Once the entire dataset has been inferred by the current operator, continue with the next operator.
5. The entire pipeline completes in this fashion.
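As a complement to the per-operator sketch on the English page above, here is a minimal hypothetical driver for steps 4 and 5: each operator finishes the whole dataset batch by batch before the next one starts, and each operator's output step file becomes the next operator's input. All names are illustrative, not DataFlow's API.

```python
import json

def run_pipeline(entry_file, operators, cache_path, batch_size=2):
    """Hypothetical driver: run operators in sequence, each consuming the
    previous operator's completed step file and appending its own output."""
    current = entry_file
    for i, op in enumerate(operators):
        step_file = f"{cache_path}/step_{i}.jsonl"
        with open(current, encoding="utf-8") as src:
            records = [json.loads(line) for line in src]
        for start in range(0, len(records), batch_size):
            batch = [op(r) for r in records[start:start + batch_size]]
            with open(step_file, "a", encoding="utf-8") as out:
                for row in batch:
                    out.write(json.dumps(row, ensure_ascii=False) + "\n")
        current = step_file  # the next operator reads this step's output
```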
## Usage

This is similar to [Framework Design – Resume Pipelines](/zh/guide/basicinfo/framework/#断点恢复流水线-resume), except that the pipeline must inherit from a different base class, `BatchedPipelineABC`. It likewise needs to be compiled, and more parameters are passed to the `forward` function. In addition, `Storage` currently needs to inherit from a special `BatchedFileStorage` class.
```python
from dataflow.pipeline import BatchedPipelineABC # [!code highlight]
from dataflow.operators.core_text import PromptedGenerator
from dataflow.serving import APILLMServing_request
from dataflow.utils.storage import BatchedFileStorage # [!code highlight]

class AutoOPPipeline(BatchedPipelineABC): # [!code highlight]

    def __init__(self):
        super().__init__()
        self.storage = BatchedFileStorage( # [!code highlight]
            first_entry_file_name="./dataflow/example/GeneralTextPipeline/pt_input.jsonl",
            cache_path="./cache_autoop",
            file_name_prefix="dataflow_cache_auto_run",
            cache_type="jsonl",
        )
        self.llm_serving = APILLMServing_request(
            api_url="https://api.openai.com/v1/chat/completions",
            model_name="gpt-4o",
            max_workers=30
        )
        self.op1 = PromptedGenerator(
            llm_serving=self.llm_serving,
            system_prompt="请将以下内容翻译成中文:",  # translate into Chinese
        )
        self.op2 = PromptedGenerator(
            llm_serving=self.llm_serving,
            system_prompt="请将以下内容翻译成韩文:",  # translate into Korean
        )
        self.op3 = PromptedGenerator(
            llm_serving=self.llm_serving,
            system_prompt="请将以下内容翻译成日语:"  # translate into Japanese
        )

    def forward(self):
        self.op1.run(
            self.storage.step(),
            input_key='raw_content',
            output_key='content_cn1'
        )
        self.op2.run(
            self.storage.step(),
            input_key='raw_content',
            output_key='content_cn2'
        )
        self.op3.run(
            self.storage.step(),
            input_key='raw_content',
            output_key='content_cn3'
        )

if __name__ == "__main__":
    pipeline = AutoOPPipeline()
    pipeline.compile() # [!code highlight]
    pipeline.forward(
        batch_size=2, # [!code highlight]
        resume_from_last=True
    )
```
`resume_from_last` automatically resumes inference from the last step file found in the current cache path.

In particular, you can instead use `resume_step` to resume from one specific earlier operator step. Only one of these two parameters may be set at a time, to avoid logical conflicts.
```python
# The following invocation is also valid
...
pipeline.compile()
pipeline.forward(
    batch_size=2,
    resume_step=2 # Resume from the operator with index 2; the first operator has index 0
)
```
Lines changed: 13 additions & 0 deletions
---
title: "Preview: Checkpoint Resume"
createTime: 2025/12/30 11:19:40
permalink: /zh/guide/resume/
---

# Beta: Checkpoint Resume

> This feature is currently in beta and may contain bugs. If you find a problem, please report it promptly via an issue. Thanks for your understanding.

## Overview

If inference is interrupted at some operator, the default workflow for rerunning from the previous operator is to comment out all the preceding operators in the pipeline and rename an intermediate cached step file to serve as the new entry point, which is cumbersome. We therefore provide a feature that resumes inference directly from an operator step.

## Usage

Please refer to the [Framework Design – Resume Pipelines](/zh/guide/basicinfo/framework/#断点恢复流水线-resume) section.
Lines changed: 5 additions & 0 deletions
---
title: write_operator
createTime: 2025/12/29 11:05:15
permalink: /zh/guide/livgzy4s/
---
Lines changed: 5 additions & 0 deletions
---
title: write_pipeline
createTime: 2025/12/29 11:05:05
permalink: /zh/guide/r8flkmy0/
---
