-
Notifications
You must be signed in to change notification settings - Fork 30
Expand file tree
/
Copy pathmsgqueue.c
More file actions
112 lines (86 loc) · 2.87 KB
/
msgqueue.c
File metadata and controls
112 lines (86 loc) · 2.87 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
// SPDX-FileCopyrightText: © 2026 Tenstorrent Inc.
// SPDX-License-Identifier: GPL-2.0-only
#include "msgqueue.h"
#include <linux/jiffies.h>
#include <linux/delay.h>
#include <linux/pci.h>
#include "device.h"
// arc_msg_push() - append one message to the request ring of an ARC message queue.
//
// @tt_dev:      device whose dev_class supplies the csm_read32/csm_write32 accessors.
// @msg:         message to send; header plus seven payload words (eight u32 in total).
// @queue_base:  address of the queue; request entries start ARC_MSG_QUEUE_HEADER_SIZE
//               bytes past it.
// @num_entries: number of slots in the request ring.
//
// The request read/write pointers run modulo 2 * num_entries, and the slot index is
// the pointer modulo num_entries. The function reads the request write pointer once,
// then polls the request read pointer until fewer than num_entries slots are occupied
// or ARC_MSG_TIMEOUT_MS has elapsed. It then writes the eight message words into the
// slot and publishes the advanced write pointer.
//
// Sleeps between polls (usleep_range), so it must not be called from atomic context.
//
// Returns true once the new write pointer has been written; false if num_entries is
// unusable (zero, or so large that 2 * num_entries wraps), if any CSM access fails,
// or if the ring stays full until the timeout.
bool arc_msg_push(struct tenstorrent_device *tt_dev, const struct arc_msg *msg, u32 queue_base, u32 num_entries)
{
	const struct tenstorrent_device_class *cls = tt_dev->dev_class;
	u32 request_base = queue_base + ARC_MSG_QUEUE_HEADER_SIZE;
	u32 ptr_modulus = 2 * num_entries;
	unsigned long timeout;
	u32 wptr;
	u32 slot;
	u32 req_offset;
	int i;

	// Catches num_entries == 0 (modulo by zero below) and a wrapped 2 * num_entries.
	if (ptr_modulus <= num_entries)
		return false;

	if (cls->csm_read32(tt_dev, ARC_MSG_QUEUE_REQ_WPTR(queue_base), &wptr) != 0)
		return false;

	// Bring the pointer into [0, ptr_modulus) so the arithmetic below cannot wrap.
	// The slot index is unaffected because num_entries divides ptr_modulus.
	wptr %= ptr_modulus;

	timeout = jiffies + msecs_to_jiffies(ARC_MSG_TIMEOUT_MS);

	for (;;) {
		u32 rptr;
		u32 num_occupied;

		if (cls->csm_read32(tt_dev, ARC_MSG_QUEUE_REQ_RPTR(queue_base), &rptr) != 0)
			return false;

		rptr %= ptr_modulus;

		// Ring distance from rptr to wptr. A plain (wptr - rptr) % ptr_modulus wraps
		// through 2^32 when wptr < rptr and is only right for power-of-two sizes.
		if (wptr >= rptr)
			num_occupied = wptr - rptr;
		else
			num_occupied = ptr_modulus - (rptr - wptr);

		if (num_occupied < num_entries)
			break;

		if (time_after(jiffies, timeout)) {
			dev_err(&tt_dev->pdev->dev, "Timeout waiting for space in ARC message queue\n");
			return false;
		}

		usleep_range(100, 200);
	}

	slot = wptr % num_entries;
	req_offset = slot * sizeof(struct arc_msg);

	// Word 0 is the header, words 1..7 are payload[0..6].
	for (i = 0; i < 8; ++i) {
		u32 addr = request_base + req_offset + (i * sizeof(u32));
		u32 value = (i == 0) ? msg->header : msg->payload[i - 1];

		if (cls->csm_write32(tt_dev, addr, value) != 0)
			return false;
	}

	// Publish the entry only after all of its words have been written.
	wptr = (wptr + 1) % ptr_modulus;
	if (cls->csm_write32(tt_dev, ARC_MSG_QUEUE_REQ_WPTR(queue_base), wptr) != 0)
		return false;

	return true;
}
// arc_msg_pop() - take one message from the response ring of an ARC message queue.
//
// @tt_dev:      device whose dev_class supplies the csm_read32/csm_write32 accessors.
// @msg:         destination; receives the header and seven payload words. It may be
//               partially overwritten if a CSM read fails midway.
// @queue_base:  address of the queue; response entries start after the queue header
//               and num_entries request entries of sizeof(struct arc_msg) bytes each.
// @num_entries: number of slots in the response ring.
//
// The response read/write pointers run modulo 2 * num_entries, and the slot index is
// the pointer modulo num_entries. The function reads the response read pointer once,
// then polls the response write pointer until at least one entry is pending or
// ARC_MSG_TIMEOUT_MS has elapsed. It then copies the entry into @msg and writes back
// the advanced read pointer.
//
// Sleeps between polls (usleep_range), so it must not be called from atomic context.
//
// Returns true once the new read pointer has been written; false if num_entries is
// unusable (zero, or so large that 2 * num_entries wraps), if any CSM access fails,
// or if no response arrives before the timeout.
bool arc_msg_pop(struct tenstorrent_device *tt_dev, struct arc_msg *msg, u32 queue_base, u32 num_entries)
{
	const struct tenstorrent_device_class *cls = tt_dev->dev_class;
	u32 response_base = queue_base + ARC_MSG_QUEUE_HEADER_SIZE + (num_entries * sizeof(struct arc_msg));
	u32 ptr_modulus = 2 * num_entries;
	unsigned long timeout;
	u32 rptr;
	u32 slot;
	u32 response_offset;
	int i;

	// Catches num_entries == 0 (modulo by zero below) and a wrapped 2 * num_entries.
	if (ptr_modulus <= num_entries)
		return false;

	if (cls->csm_read32(tt_dev, ARC_MSG_QUEUE_RES_RPTR(queue_base), &rptr) != 0)
		return false;

	// Bring the pointer into [0, ptr_modulus) so the arithmetic below cannot wrap.
	// The slot index is unaffected because num_entries divides ptr_modulus.
	rptr %= ptr_modulus;

	timeout = jiffies + msecs_to_jiffies(ARC_MSG_TIMEOUT_MS);

	for (;;) {
		u32 wptr;
		u32 num_occupied;

		if (cls->csm_read32(tt_dev, ARC_MSG_QUEUE_RES_WPTR(queue_base), &wptr) != 0)
			return false;

		wptr %= ptr_modulus;

		// Ring distance from rptr to wptr. A plain (wptr - rptr) % ptr_modulus wraps
		// through 2^32 when wptr < rptr and is only right for power-of-two sizes.
		if (wptr >= rptr)
			num_occupied = wptr - rptr;
		else
			num_occupied = ptr_modulus - (rptr - wptr);

		if (num_occupied > 0)
			break;

		if (time_after(jiffies, timeout)) {
			dev_err(&tt_dev->pdev->dev, "Timeout waiting for ARC response\n");
			return false;
		}

		usleep_range(100, 200);
	}

	slot = rptr % num_entries;
	response_offset = slot * sizeof(struct arc_msg);

	// Word 0 of the entry is the header.
	if (cls->csm_read32(tt_dev, response_base + response_offset, &msg->header) != 0)
		return false;

	// Words 1..7 of the entry are payload[0..6].
	for (i = 0; i < 7; ++i) {
		u32 addr = response_base + response_offset + ((i + 1) * sizeof(u32));

		if (cls->csm_read32(tt_dev, addr, &msg->payload[i]) != 0)
			return false;
	}

	// Release the slot only after the whole entry has been copied out.
	rptr = (rptr + 1) % ptr_modulus;
	if (cls->csm_write32(tt_dev, ARC_MSG_QUEUE_RES_RPTR(queue_base), rptr) != 0)
		return false;

	return true;
}