]>
Commit | Line | Data |
---|---|---|
3a4d5c94 MT |
1 | #ifndef _VHOST_H |
2 | #define _VHOST_H | |
3 | ||
4 | #include <linux/eventfd.h> | |
5 | #include <linux/vhost.h> | |
6 | #include <linux/mm.h> | |
7 | #include <linux/mutex.h> | |
3a4d5c94 MT |
8 | #include <linux/poll.h> |
9 | #include <linux/file.h> | |
3a4d5c94 MT |
10 | #include <linux/uio.h> |
11 | #include <linux/virtio_config.h> | |
12 | #include <linux/virtio_ring.h> | |
60063497 | 13 | #include <linux/atomic.h> |
3a4d5c94 MT |
14 | |
15 | struct vhost_device; | |
16 | ||
c23f3445 TH |
17 | struct vhost_work; |
18 | typedef void (*vhost_work_fn_t)(struct vhost_work *work); | |
19 | ||
20 | struct vhost_work { | |
21 | struct list_head node; | |
22 | vhost_work_fn_t fn; | |
23 | wait_queue_head_t done; | |
24 | int flushing; | |
25 | unsigned queue_seq; | |
26 | unsigned done_seq; | |
27 | }; | |
28 | ||
3a4d5c94 MT |
29 | /* Poll a file (eventfd or socket) */ |
30 | /* Note: there's nothing vhost specific about this structure. */ | |
31 | struct vhost_poll { | |
32 | poll_table table; | |
33 | wait_queue_head_t *wqh; | |
34 | wait_queue_t wait; | |
c23f3445 | 35 | struct vhost_work work; |
3a4d5c94 | 36 | unsigned long mask; |
c23f3445 | 37 | struct vhost_dev *dev; |
3a4d5c94 MT |
38 | }; |
39 | ||
163049ae SH |
40 | void vhost_work_init(struct vhost_work *work, vhost_work_fn_t fn); |
41 | void vhost_work_queue(struct vhost_dev *dev, struct vhost_work *work); | |
42 | ||
c23f3445 TH |
43 | void vhost_poll_init(struct vhost_poll *poll, vhost_work_fn_t fn, |
44 | unsigned long mask, struct vhost_dev *dev); | |
3a4d5c94 MT |
45 | void vhost_poll_start(struct vhost_poll *poll, struct file *file); |
46 | void vhost_poll_stop(struct vhost_poll *poll); | |
47 | void vhost_poll_flush(struct vhost_poll *poll); | |
48 | void vhost_poll_queue(struct vhost_poll *poll); | |
49 | ||
50 | struct vhost_log { | |
51 | u64 addr; | |
52 | u64 len; | |
53 | }; | |
54 | ||
bab632d6 MT |
55 | struct vhost_virtqueue; |
56 | ||
57 | struct vhost_ubuf_ref { | |
58 | struct kref kref; | |
59 | wait_queue_head_t wait; | |
60 | struct vhost_virtqueue *vq; | |
61 | }; | |
62 | ||
63 | struct vhost_ubuf_ref *vhost_ubuf_alloc(struct vhost_virtqueue *, bool zcopy); | |
64 | void vhost_ubuf_put(struct vhost_ubuf_ref *); | |
65 | void vhost_ubuf_put_and_wait(struct vhost_ubuf_ref *); | |
66 | ||
b211616d MT |
67 | struct ubuf_info; |
68 | ||
3a4d5c94 MT |
69 | /* The virtqueue structure describes a queue attached to a device. */ |
70 | struct vhost_virtqueue { | |
71 | struct vhost_dev *dev; | |
72 | ||
73 | /* The actual ring of buffers. */ | |
74 | struct mutex mutex; | |
75 | unsigned int num; | |
76 | struct vring_desc __user *desc; | |
77 | struct vring_avail __user *avail; | |
78 | struct vring_used __user *used; | |
79 | struct file *kick; | |
80 | struct file *call; | |
81 | struct file *error; | |
82 | struct eventfd_ctx *call_ctx; | |
83 | struct eventfd_ctx *error_ctx; | |
84 | struct eventfd_ctx *log_ctx; | |
85 | ||
86 | struct vhost_poll poll; | |
87 | ||
88 | /* The routine to call when the Guest pings us, or on timeout. */ | |
c23f3445 | 89 | vhost_work_fn_t handle_kick; |
3a4d5c94 MT |
90 | |
91 | /* Last available index we saw. */ | |
92 | u16 last_avail_idx; | |
93 | ||
94 | /* Caches available index value from user. */ | |
95 | u16 avail_idx; | |
96 | ||
97 | /* Last index we used. */ | |
98 | u16 last_used_idx; | |
99 | ||
100 | /* Used flags */ | |
101 | u16 used_flags; | |
102 | ||
8ea8cf89 MT |
103 | /* Last used index value we have signalled on */ |
104 | u16 signalled_used; | |
105 | ||
106 | /* Whether signalled_used currently holds a valid value */ | |
107 | bool signalled_used_valid; | |
108 | ||
3a4d5c94 MT |
109 | /* Log writes to used structure. */ |
110 | bool log_used; | |
111 | u64 log_addr; | |
112 | ||
e0e9b406 JW |
113 | struct iovec iov[UIO_MAXIOV]; |
114 | /* hdr is used to store the virtio header. | |
115 | * Since each iovec has >= 1 byte length, we never need more than | |
116 | * header length entries to store the header. */ | |
117 | struct iovec hdr[sizeof(struct virtio_net_hdr_mrg_rxbuf)]; | |
118 | struct iovec *indirect; | |
8dd014ad DS |
119 | size_t vhost_hlen; |
120 | size_t sock_hlen; | |
e0e9b406 | 121 | struct vring_used_elem *heads; |
3a4d5c94 | 122 | /* We use a kind of RCU to access private pointer. |
c23f3445 TH |
123 | * All readers access it from worker, which makes it possible to |
124 | * flush the vhost_work instead of synchronize_rcu. Therefore readers do | |
3a4d5c94 | 125 | * not need to call rcu_read_lock/rcu_read_unlock: the beginning of |
c23f3445 | 126 | * vhost_work execution acts instead of rcu_read_lock() and the end of |
a290aec8 | 127 | * vhost_work execution acts instead of rcu_read_unlock(). |
3a4d5c94 | 128 | * Writers use virtqueue mutex. */ |
28457ee6 | 129 | void __rcu *private_data; |
3a4d5c94 MT |
130 | /* Log write descriptors */ |
131 | void __user *log_base; | |
e0e9b406 | 132 | struct vhost_log *log; |
bab632d6 MT |
133 | /* vhost zerocopy support fields below: */ |
134 | /* last used idx for outstanding DMA zerocopy buffers */ | |
135 | int upend_idx; | |
136 | /* first used idx for DMA done zerocopy buffers */ | |
137 | int done_idx; | |
138 | /* an array of userspace buffers info */ | |
139 | struct ubuf_info *ubuf_info; | |
140 | /* Reference counting for outstanding ubufs. | |
141 | * Protected by vq mutex. Writers must also take device mutex. */ | |
142 | struct vhost_ubuf_ref *ubufs; | |
3a4d5c94 MT |
143 | }; |
144 | ||
145 | struct vhost_dev { | |
146 | /* Readers use RCU to access memory table pointer, | |
147 | * log base pointer and features. | |
148 | * Writers use mutex below.*/ | |
28457ee6 | 149 | struct vhost_memory __rcu *memory; |
3a4d5c94 MT |
150 | struct mm_struct *mm; |
151 | struct mutex mutex; | |
152 | unsigned acked_features; | |
153 | struct vhost_virtqueue *vqs; | |
154 | int nvqs; | |
155 | struct file *log_file; | |
156 | struct eventfd_ctx *log_ctx; | |
c23f3445 TH |
157 | spinlock_t work_lock; |
158 | struct list_head work_list; | |
159 | struct task_struct *worker; | |
3a4d5c94 MT |
160 | }; |
161 | ||
162 | long vhost_dev_init(struct vhost_dev *, struct vhost_virtqueue *vqs, int nvqs); | |
163 | long vhost_dev_check_owner(struct vhost_dev *); | |
164 | long vhost_dev_reset_owner(struct vhost_dev *); | |
ea5d4046 | 165 | void vhost_dev_cleanup(struct vhost_dev *, bool locked); |
b211616d | 166 | void vhost_dev_stop(struct vhost_dev *); |
3a4d5c94 MT |
167 | long vhost_dev_ioctl(struct vhost_dev *, unsigned int ioctl, unsigned long arg); |
168 | int vhost_vq_access_ok(struct vhost_virtqueue *vq); | |
169 | int vhost_log_access_ok(struct vhost_dev *); | |
170 | ||
d5675bd2 MT |
171 | int vhost_get_vq_desc(struct vhost_dev *, struct vhost_virtqueue *, |
172 | struct iovec iov[], unsigned int iov_count, | |
173 | unsigned int *out_num, unsigned int *in_num, | |
174 | struct vhost_log *log, unsigned int *log_num); | |
8dd014ad | 175 | void vhost_discard_vq_desc(struct vhost_virtqueue *, int n); |
3a4d5c94 | 176 | |
f59281da | 177 | int vhost_init_used(struct vhost_virtqueue *); |
3a4d5c94 | 178 | int vhost_add_used(struct vhost_virtqueue *, unsigned int head, int len); |
8dd014ad DS |
179 | int vhost_add_used_n(struct vhost_virtqueue *, struct vring_used_elem *heads, |
180 | unsigned count); | |
3a4d5c94 | 181 | void vhost_add_used_and_signal(struct vhost_dev *, struct vhost_virtqueue *, |
8dd014ad DS |
182 | unsigned int id, int len); |
183 | void vhost_add_used_and_signal_n(struct vhost_dev *, struct vhost_virtqueue *, | |
184 | struct vring_used_elem *heads, unsigned count); | |
185 | void vhost_signal(struct vhost_dev *, struct vhost_virtqueue *); | |
8ea8cf89 MT |
186 | void vhost_disable_notify(struct vhost_dev *, struct vhost_virtqueue *); |
187 | bool vhost_enable_notify(struct vhost_dev *, struct vhost_virtqueue *); | |
3a4d5c94 MT |
188 | |
189 | int vhost_log_write(struct vhost_virtqueue *vq, struct vhost_log *log, | |
190 | unsigned int log_num, u64 len); | |
191 | ||
3a4d5c94 MT |
192 | #define vq_err(vq, fmt, ...) do { \ |
193 | pr_debug(pr_fmt(fmt), ##__VA_ARGS__); \ | |
194 | if ((vq)->error_ctx) \ | |
195 | eventfd_signal((vq)->error_ctx, 1);\ | |
196 | } while (0) | |
197 | ||
198 | enum { | |
8ea8cf89 MT |
199 | VHOST_FEATURES = (1ULL << VIRTIO_F_NOTIFY_ON_EMPTY) | |
200 | (1ULL << VIRTIO_RING_F_INDIRECT_DESC) | | |
201 | (1ULL << VIRTIO_RING_F_EVENT_IDX) | | |
0dd05a3b SH |
202 | (1ULL << VHOST_F_LOG_ALL), |
203 | VHOST_NET_FEATURES = VHOST_FEATURES | | |
8ea8cf89 MT |
204 | (1ULL << VHOST_NET_F_VIRTIO_NET_HDR) | |
205 | (1ULL << VIRTIO_NET_F_MRG_RXBUF), | |
3a4d5c94 MT |
206 | }; |
207 | ||
208 | static inline int vhost_has_feature(struct vhost_dev *dev, int bit) | |
209 | { /* Returns nonzero iff feature number 'bit' is set in dev->acked_features. */ | |
28457ee6 AB |
210 | unsigned acked_features; |
211 | ||
5e18247b MT |
212 | /* TODO: check that we are running from vhost_worker or dev mutex is |
213 | * held? */ | |
214 | acked_features = rcu_dereference_index_check(dev->acked_features, 1); | |
3a4d5c94 MT |
215 | return acked_features & (1U << bit); /* unsigned mask: 1 << 31 would overflow a signed int */ |
216 | } | |
217 | ||
bab632d6 MT |
218 | void vhost_enable_zcopy(int vq); |
219 | ||
3a4d5c94 | 220 | #endif |