You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
"description": "Whisper is a pre-trained model for automatic speech recognition (ASR) and speech translation. Trained on 680k hours of labelled data, Whisper models demonstrate a strong ability to generalize to many datasets and domains without the need for fine-tuning. This is the English-only version of the Whisper Tiny model which was trained on the task of speech recognition.",
6
-
"task": {
7
-
"id": "dfce1c48-2a81-462e-a7fd-de97ce985207",
8
-
"name": "Automatic Speech Recognition",
9
-
"description": "Automatic speech recognition (ASR) models convert a speech signal, typically an audio input, to text."
10
-
},
11
-
"tags": [],
12
-
"properties": [
13
-
{
14
-
"property_id": "beta",
15
-
"value": "true"
16
-
}
17
-
],
18
-
"schema": {
19
-
"input": {
20
-
"oneOf": [
21
-
{
22
-
"type": "string",
23
-
"format": "binary"
24
-
},
25
-
{
26
-
"type": "object",
27
-
"properties": {
28
-
"audio": {
29
-
"type": "array",
30
-
"description": "An array of integers that represent the audio data constrained to 8-bit unsigned integer values",
31
-
"items": {
32
-
"type": "number",
33
-
"description": "A value between 0 and 255"
34
-
}
35
-
}
36
-
},
37
-
"required": ["audio"]
38
-
}
39
-
]
40
-
},
41
-
"output": {
42
-
"type": "object",
43
-
"contentType": "application/json",
44
-
"properties": {
45
-
"text": {
46
-
"type": "string",
47
-
"description": "The transcription"
48
-
},
49
-
"word_count": {
50
-
"type": "number"
51
-
},
52
-
"words": {
53
-
"type": "array",
54
-
"items": {
55
-
"type": "object",
56
-
"properties": {
57
-
"word": {
58
-
"type": "string"
59
-
},
60
-
"start": {
61
-
"type": "number",
62
-
"description": "The second this word begins in the recording"
63
-
},
64
-
"end": {
65
-
"type": "number",
66
-
"description": "The ending second when the word completes"
67
-
}
68
-
}
69
-
}
70
-
},
71
-
"vtt": {
72
-
"type": "string"
73
-
}
74
-
},
75
-
"required": ["text"]
76
-
}
77
-
}
78
-
}
2
+
"id": "2169496d-9c0e-4e49-8399-c44ee66bff7d",
3
+
"source": 1,
4
+
"name": "@cf/openai/whisper-tiny-en",
5
+
"description": "Whisper is a pre-trained model for automatic speech recognition (ASR) and speech translation. Trained on 680k hours of labelled data, Whisper models demonstrate a strong ability to generalize to many datasets and domains without the need for fine-tuning. This is the English-only version of the Whisper Tiny model which was trained on the task of speech recognition.",
6
+
"task": {
7
+
"id": "dfce1c48-2a81-462e-a7fd-de97ce985207",
8
+
"name": "Automatic Speech Recognition",
9
+
"description": "Automatic speech recognition (ASR) models convert a speech signal, typically an audio input, to text."
10
+
},
11
+
"tags": [],
12
+
"properties": [
13
+
{
14
+
"property_id": "beta",
15
+
"value": "true"
16
+
}
17
+
],
18
+
"schema": {
19
+
"input": {
20
+
"oneOf": [
21
+
{
22
+
"type": "string",
23
+
"format": "binary"
24
+
},
25
+
{
26
+
"type": "object",
27
+
"properties": {
28
+
"audio": {
29
+
"type": "array",
30
+
"description": "An array of integers that represent the audio data constrained to 8-bit unsigned integer values",
31
+
"items": {
32
+
"type": "number",
33
+
"description": "A value between 0 and 255"
34
+
}
35
+
}
36
+
},
37
+
"required": [
38
+
"audio"
39
+
]
40
+
}
41
+
]
42
+
},
43
+
"output": {
44
+
"type": "object",
45
+
"contentType": "application/json",
46
+
"properties": {
47
+
"text": {
48
+
"type": "string",
49
+
"description": "The transcription"
50
+
},
51
+
"word_count": {
52
+
"type": "number"
53
+
},
54
+
"words": {
55
+
"type": "array",
56
+
"items": {
57
+
"type": "object",
58
+
"properties": {
59
+
"word": {
60
+
"type": "string"
61
+
},
62
+
"start": {
63
+
"type": "number",
64
+
"description": "The second this word begins in the recording"
65
+
},
66
+
"end": {
67
+
"type": "number",
68
+
"description": "The ending second when the word completes"
0 commit comments