Skip to content

Commit 7f85a1b

Browse files
committed
doc: add image to README.md
1 parent 68aa081 commit 7f85a1b

File tree

2 files changed

+41
-0
lines changed

2 files changed

+41
-0
lines changed

README.md

Lines changed: 27 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -659,6 +659,9 @@ When using this task, do not enable streaming. Otherwise, `completion.Output.Cho
659659
In addition to the standard text content, this task also returns the coordinates of the text.
660660

661661
To call this built-in task, set `Parameters.OcrOptions.Task` to `advanced_recognition`. No additional prompt is required.
662+
663+
![Tilted image](sample/Cnblogs.DashScope.Sample/tilted.png)
664+
662665
```csharp
663666
var messages = new List<MultimodalMessage>();
664667
messages.Add(
@@ -743,6 +746,8 @@ You can customize the output JSON format via `Parameters.OcrOptions.TaskConfig.R
743746

744747
For example, suppose we want to extract objects of the following type from an image (JSON property names should, as much as possible, be based on the text present in the image):
745748

749+
![Train ticket](sample/Cnblogs.DashScope.Sample/receipt.jpg)
750+
746751
```csharp
747752
internal class ReceiptModel()
748753
{
@@ -842,6 +847,8 @@ This task will extract tables from images and return them in HTML format.
842847

843848
Example:
844849

850+
![Table](sample/Cnblogs.DashScope.Sample/table.jpg)
851+
845852
```csharp
846853
await using var file = File.OpenRead("table.jpg");
847854
var ossLink = await client.UploadTemporaryFileAsync("qwen-vl-ocr-latest", file, "table.jpg");
@@ -1106,6 +1113,8 @@ This task read images(usually scanned PDF) and return them in LaTeX format.
11061113

11071114
Example:
11081115

1116+
![Scanned paper](sample/Cnblogs.DashScope.Sample/scanned.jpg)
1117+
11091118
```csharp
11101119
await using var file = File.OpenRead("scanned.jpg");
11111120
var ossLink = await client.UploadTemporaryFileAsync("qwen-vl-ocr-latest", file, "scanned.jpg");
@@ -1161,6 +1170,8 @@ This task read images(like handwriting formulas) and return them in LaTeX format
11611170

11621171
Example:
11631172

1173+
![Handwritten math formula](sample/Cnblogs.DashScope.Sample/math.jpg)
1174+
11641175
```csharp
11651176
// upload file
11661177
await using var file = File.OpenRead("math.jpg");
@@ -1207,6 +1218,18 @@ I^{m_n} - (L+1) &= z + \int_0^1 I^{m_n} - (L)z \leq x_m | L^{m_n} - (L) |^3 \\
12071218
```
12081219
````
12091220

1221+
$$
1222+
\begin{align*}
1223+
\tilde{G}(x) &= \frac{\alpha}{\kappa}x, \quad \tilde{T}_i = T, \quad \tilde{H}_i = \tilde{\kappa}T, \quad \tilde{\lambda}_i = \frac{1}{\kappa}\sum_{j=1}^{m}\omega_j - z_i, \\
1224+
L(\{p_n\}; m^n) + L(\{x^n\}, m^n) + L(\{m^n\}; q_n) &= L(m^n; q_n) \\
1225+
I^{m_n} - (L+1) &= z + \int_0^1 I^{m_n} - (L)z \leq x_m | L^{m_n} - (L) |^3 \\
1226+
&\leq \kappa\partial_1\psi(x) + \frac{\kappa^3}{6}\partial_2^3\psi(x) - V(x) \psi(x) = \int d^3y K(x,y) \psi(y), \\
1227+
\int_{B_{\kappa}(0)} I^{m}(w)^2 d\gamma &= \lim_{n\to\infty} \int_{B_{\kappa}(0)} r\psi(w_n)^2 d\gamma = \lim_{n\to\infty} \int_{B_{\kappa}(y_n)} d\gamma \geq \beta > 0,
1228+
\end{align*}
1229+
$$
1230+
1231+
1232+
12101233
##### Text Recognition
12111234

12121235
To invoke this built-in task, set `Parameters.OcrOptions.Task` to `text_recognition`. No additional text information needs to be provided.
@@ -1215,6 +1238,8 @@ This task read the images and returns content in plain text(Chinese and English
12151238

12161239
Example:
12171240

1241+
![Webpage](sample/Cnblogs.DashScope.Sample/webpage.jpg)
1242+
12181243
```csharp
12191244
// upload file
12201245
await using var file = File.OpenRead("webpage.jpg");
@@ -1250,6 +1275,8 @@ To invoke this built-in task, set `Parameters.OcrOptions.Task` to `multi_lan`. N
12501275

12511276
This task reads images and returns their content as plain text (with support for more languages).
12521277

1278+
![Multi-language text](sample/Cnblogs.DashScope.Sample/multilanguage.jpg)
1279+
12531280
```csharp
12541281
await using var file = File.OpenRead("multilanguage.jpg");
12551282
var ossLink = await client.UploadTemporaryFileAsync("qwen-vl-ocr-latest", file, "multilanguage.jpg");

README.zh-Hans.md

Lines changed: 14 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2585,6 +2585,8 @@ var completion = client.GetMultimodalGenerationAsync(
25852585
25862586
示例:
25872587
2588+
![倾斜的图像](sample/Cnblogs.DashScope.Sample/tilted.png)
2589+
25882590
```csharp
25892591
Console.WriteLine("Text:");
25902592
Console.WriteLine(completion.Output.Choices[0].Message.Content[0].Text);
@@ -2669,6 +2671,8 @@ internal class ReceiptSerials
26692671
26702672
示例请求:
26712673
2674+
![车票](sample/Cnblogs.DashScope.Sample/receipt.jpg)
2675+
26722676
```csharp
26732677
await using var file = File.OpenRead("receipt.jpg");
26742678
var ossLink = await client.UploadTemporaryFileAsync("qwen-vl-ocr-latest", file, "receipt.jpg");
@@ -2745,6 +2749,8 @@ Usage: in(524)/out(65)/image(310)/total(589)
27452749
27462750
示例:
27472751
2752+
![表格](sample/Cnblogs.DashScope.Sample/table.jpg)
2753+
27482754
```csharp
27492755
await using var file = File.OpenRead("table.jpg");
27502756
var ossLink = await client.UploadTemporaryFileAsync("qwen-vl-ocr-latest", file, "table.jpg");
@@ -3007,6 +3013,8 @@ Console.WriteLine(completion.Output.Choices[0].Message.Content[0].Text);
30073013
30083014
该任务会识读图片(例如扫描版 PDF)并返回 LaTeX 格式的文档。
30093015
3016+
![论文](sample/Cnblogs.DashScope.Sample/scanned.jpg)
3017+
30103018
```csharp
30113019
await using var file = File.OpenRead("scanned.jpg");
30123020
var ossLink = await client.UploadTemporaryFileAsync("qwen-vl-ocr-latest", file, "scanned.jpg");
@@ -3060,6 +3068,8 @@ Recent advancements in large vision-language models (LVLMS) (Li et al., 2023c; L
30603068
30613069
该任务会识读图片中的公式(例如手写数学公式)并以 LaTeX 形式返回。
30623070
3071+
![手写数学公式](sample/Cnblogs.DashScope.Sample/math.jpg)
3072+
30633073
```csharp
30643074
// upload file
30653075
await using var file = File.OpenRead("math.jpg");
@@ -3114,6 +3124,8 @@ I^{m_n} - (L+1) &= z + \int_0^1 I^{m_n} - (L)z \leq x_m | L^{m_n} - (L) |^3 \\
31143124
31153125
示例请求:
31163126
3127+
![网页](sample/Cnblogs.DashScope.Sample/webpage.jpg)
3128+
31173129
```csharp
31183130
// upload file
31193131
await using var file = File.OpenRead("webpage.jpg");
@@ -3153,6 +3165,8 @@ Python Java curl
31533165
31543166
示例请求:
31553167
3168+
![Hello](sample/Cnblogs.DashScope.Sample/multilanguage.jpg)
3169+
31563170
```csharp
31573171
await using var file = File.OpenRead("multilanguage.jpg");
31583172
var ossLink = await client.UploadTemporaryFileAsync("qwen-vl-ocr-latest", file, "multilanguage.jpg");

0 commit comments

Comments
 (0)