generated from amazon-archives/__template_MIT-0
-
Notifications
You must be signed in to change notification settings - Fork 53
Expand file tree
/
Copy pathmain.go
More file actions
100 lines (82 loc) · 2.97 KB
/
main.go
File metadata and controls
100 lines (82 loc) · 2.97 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
package main
import (
"context"
"flag"
"image"
_ "image/jpeg"
_ "image/png"
"log"
"github.com/aws/aws-sdk-go-v2/aws"
"github.com/aws/aws-sdk-go-v2/config"
"github.com/aws/aws-sdk-go-v2/service/rekognition"
"github.com/aws/aws-sdk-go-v2/service/rekognition/types"
"github.com/aws/aws-sdk-go-v2/service/s3"
"github.com/fogleman/gg"
)
var bucketName = flag.String("bucket", "", "The name of the bucket to get the object")
var key = flag.String("key", "", "The s3 object key to the image file (JPEG, JPG, PNG)")
var modelArn = flag.String("model-arn", "", "The rekognition custom labels model arn")
var minConfidence = float32(*flag.Float64("min-confidence", 70, "The minimum confidence value "))
func main() {
flag.Parse()
cfg, err := config.LoadDefaultConfig(context.TODO())
if err != nil {
log.Fatalf("unable to load SDK config, %v", err)
}
svc := rekognition.NewFromConfig(cfg)
var s3Obj = types.S3Object{
Bucket: bucketName,
Name: key}
resp, err := svc.DetectCustomLabels(context.TODO(), &rekognition.DetectCustomLabelsInput{
Image: &types.Image{
S3Object: &s3Obj},
ProjectVersionArn: modelArn,
MinConfidence: aws.Float32(minConfidence),
})
if err != nil {
log.Fatalf("unable to detect custom labels, %v", err)
}
log.Printf("Detected %v labels", len(resp.CustomLabels))
for _, label := range resp.CustomLabels {
log.Printf("%v: %v\b", *label.Name, *label.Confidence)
}
s3Client := s3.NewFromConfig(cfg)
input := s3.GetObjectInput{
Bucket: bucketName,
Key: key,
}
s3Resp, err := s3Client.GetObject(context.TODO(), &input)
if err != nil {
log.Fatalf("unable to retrieve image: %v", err)
}
i, _, err := image.Decode(s3Resp.Body)
if err != nil {
log.Fatalf("can't decode image: %v", err)
}
ggContext := gg.NewContextForImage(i)
err = ggContext.LoadFontFace("/Library/Fonts/Arial Unicode.ttf", 100)
if err != nil {
log.Fatalf("Unable to load font: %v", err)
}
ggContext.SetRGB(1, 0, 0)
ggContext.SetLineWidth(10)
for i, label := range resp.CustomLabels {
x := float64(*label.Geometry.BoundingBox.Left) * float64(ggContext.Width())
y := float64(*label.Geometry.BoundingBox.Top) * float64(ggContext.Height())
w := float64(*label.Geometry.BoundingBox.Width) * float64(ggContext.Width())
h := float64(*label.Geometry.BoundingBox.Height) * float64(ggContext.Height())
log.Printf("Detected label #%v: %v", i, *label.Name)
log.Printf("\tLeft: %v", x)
log.Printf("\tTop: %v", y)
log.Printf("\tWidth: %v", w)
log.Printf("\tHeight: %v", h)
ggContext.DrawRectangle(x, y, w, h)
ggContext.Stroke()
ggContext.DrawString(*label.Name, x, y)
ggContext.Stroke()
}
err = ggContext.SavePNG("output.png")
if err != nil {
log.Fatalf("error saving image: %v", err)
}
}