vringh_test.c 20 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741
  /* Simple test of virtio code, entirely in userspace. */
  2. #define _GNU_SOURCE
  3. #include <sched.h>
  4. #include <err.h>
  5. #include <linux/kernel.h>
  6. #include <linux/err.h>
  7. #include <linux/virtio.h>
  8. #include <linux/vringh.h>
  9. #include <linux/virtio_ring.h>
  10. #include <linux/uaccess.h>
  11. #include <sys/types.h>
  12. #include <sys/stat.h>
  13. #include <sys/mman.h>
  14. #include <sys/wait.h>
  15. #include <fcntl.h>
  16. #define USER_MEM (1024*1024)
  17. void *__user_addr_min, *__user_addr_max;
  18. void *__kmalloc_fake, *__kfree_ignore_start, *__kfree_ignore_end;
  19. static u64 user_addr_offset;
  20. #define RINGSIZE 256
  21. #define ALIGN 4096
  /*
   * Host-notification hook used by the single-process test in main().
   * It is never expected to run, so it aborts the program if called.
   */
  static void never_notify_host(struct virtqueue *vq)
  {
      (void)vq;
      abort();
  }
  /*
   * Guest-callback hook handed to vring_new_virtqueue().
   * It is never expected to run, so it aborts the program if called.
   */
  static void never_callback_guest(struct virtqueue *vq)
  {
      (void)vq;
      abort();
  }
  30. static bool getrange_iov(struct vringh *vrh, u64 addr, struct vringh_range *r)
  31. {
  32. if (addr < (u64)(unsigned long)__user_addr_min - user_addr_offset)
  33. return false;
  34. if (addr >= (u64)(unsigned long)__user_addr_max - user_addr_offset)
  35. return false;
  36. r->start = (u64)(unsigned long)__user_addr_min - user_addr_offset;
  37. r->end_incl = (u64)(unsigned long)__user_addr_max - 1 - user_addr_offset;
  38. r->offset = user_addr_offset;
  39. return true;
  40. }
  41. /* We return single byte ranges. */
  42. static bool getrange_slow(struct vringh *vrh, u64 addr, struct vringh_range *r)
  43. {
  44. if (addr < (u64)(unsigned long)__user_addr_min - user_addr_offset)
  45. return false;
  46. if (addr >= (u64)(unsigned long)__user_addr_max - user_addr_offset)
  47. return false;
  48. r->start = addr;
  49. r->end_incl = r->start;
  50. r->offset = user_addr_offset;
  51. return true;
  52. }
  53. struct guest_virtio_device {
  54. struct virtio_device vdev;
  55. int to_host_fd;
  56. unsigned long notifies;
  57. };
  58. static void parallel_notify_host(struct virtqueue *vq)
  59. {
  60. struct guest_virtio_device *gvdev;
  61. gvdev = container_of(vq->vdev, struct guest_virtio_device, vdev);
  62. write(gvdev->to_host_fd, "", 1);
  63. gvdev->notifies++;
  64. }
  /*
   * Notify hook that does nothing.  parallel_test() installs it when
   * fast_vringh is set, where the host polls with vringh_get_head().
   */
  static void no_notify_host(struct virtqueue *vq)
  {
      (void)vq;
  }
  /* Number of buffers pushed through the ring by parallel_test(). */
  #define NUM_XFERS (10000000)
  /*
   * We aim for two "distant" cpus.
   *
   * Probes CPU numbers 0..4095 by trying to pin this process to each one
   * in turn.  On return *first holds the lowest and *last the highest
   * number that could be pinned (-1U and 0 respectively if none could).
   * The process is left with whatever affinity the last successful
   * probe set.
   */
  static void find_cpus(unsigned int *first, unsigned int *last)
  {
      unsigned int lowest = -1U;
      unsigned int highest = 0;
      unsigned int cpu;

      for (cpu = 0; cpu < 4096; cpu++) {
          cpu_set_t probe;

          CPU_ZERO(&probe);
          CPU_SET(cpu, &probe);
          if (sched_setaffinity(getpid(), sizeof(probe), &probe) != 0)
              continue;

          if (cpu < lowest)
              lowest = cpu;
          if (cpu > highest)
              highest = cpu;
      }

      *first = lowest;
      *last = highest;
  }
  87. /* Opencoded version for fast mode */
  88. static inline int vringh_get_head(struct vringh *vrh, u16 *head)
  89. {
  90. u16 avail_idx, i;
  91. int err;
  92. err = get_user(avail_idx, &vrh->vring.avail->idx);
  93. if (err)
  94. return err;
  95. if (vrh->last_avail_idx == avail_idx)
  96. return 0;
  97. /* Only get avail ring entries after they have been exposed by guest. */
  98. virtio_rmb(vrh->weak_barriers);
  99. i = vrh->last_avail_idx & (vrh->vring.num - 1);
  100. err = get_user(*head, &vrh->vring.avail->ring[i]);
  101. if (err)
  102. return err;
  103. vrh->last_avail_idx++;
  104. return 1;
  105. }
  106. static int parallel_test(unsigned long features,
  107. bool (*getrange)(struct vringh *vrh,
  108. u64 addr, struct vringh_range *r),
  109. bool fast_vringh)
  110. {
  111. void *host_map, *guest_map;
  112. int fd, mapsize, to_guest[2], to_host[2];
  113. unsigned long xfers = 0, notifies = 0, receives = 0;
  114. unsigned int first_cpu, last_cpu;
  115. cpu_set_t cpu_set;
  116. char buf[128];
  117. /* Create real file to mmap. */
  118. fd = open("/tmp/vringh_test-file", O_RDWR|O_CREAT|O_TRUNC, 0600);
  119. if (fd < 0)
  120. err(1, "Opening /tmp/vringh_test-file");
  121. /* Extra room at the end for some data, and indirects */
  122. mapsize = vring_size(RINGSIZE, ALIGN)
  123. + RINGSIZE * 2 * sizeof(int)
  124. + RINGSIZE * 6 * sizeof(struct vring_desc);
  125. mapsize = (mapsize + getpagesize() - 1) & ~(getpagesize() - 1);
  126. ftruncate(fd, mapsize);
  127. /* Parent and child use separate addresses, to check our mapping logic! */
  128. host_map = mmap(NULL, mapsize, PROT_READ|PROT_WRITE, MAP_SHARED, fd, 0);
  129. guest_map = mmap(NULL, mapsize, PROT_READ|PROT_WRITE, MAP_SHARED, fd, 0);
  130. pipe(to_guest);
  131. pipe(to_host);
  132. CPU_ZERO(&cpu_set);
  133. find_cpus(&first_cpu, &last_cpu);
  134. printf("Using CPUS %u and %u\n", first_cpu, last_cpu);
  135. fflush(stdout);
  136. if (fork() != 0) {
  137. struct vringh vrh;
  138. int status, err, rlen = 0;
  139. char rbuf[5];
  140. /* We are the host: never access guest addresses! */
  141. munmap(guest_map, mapsize);
  142. __user_addr_min = host_map;
  143. __user_addr_max = __user_addr_min + mapsize;
  144. user_addr_offset = host_map - guest_map;
  145. assert(user_addr_offset);
  146. close(to_guest[0]);
  147. close(to_host[1]);
  148. vring_init(&vrh.vring, RINGSIZE, host_map, ALIGN);
  149. vringh_init_user(&vrh, features, RINGSIZE, true,
  150. vrh.vring.desc, vrh.vring.avail, vrh.vring.used);
  151. CPU_SET(first_cpu, &cpu_set);
  152. if (sched_setaffinity(getpid(), sizeof(cpu_set), &cpu_set))
  153. errx(1, "Could not set affinity to cpu %u", first_cpu);
  154. while (xfers < NUM_XFERS) {
  155. struct iovec host_riov[2], host_wiov[2];
  156. struct vringh_iov riov, wiov;
  157. u16 head, written;
  158. if (fast_vringh) {
  159. for (;;) {
  160. err = vringh_get_head(&vrh, &head);
  161. if (err != 0)
  162. break;
  163. err = vringh_need_notify_user(&vrh);
  164. if (err < 0)
  165. errx(1, "vringh_need_notify_user: %i",
  166. err);
  167. if (err) {
  168. write(to_guest[1], "", 1);
  169. notifies++;
  170. }
  171. }
  172. if (err != 1)
  173. errx(1, "vringh_get_head");
  174. written = 0;
  175. goto complete;
  176. } else {
  177. vringh_iov_init(&riov,
  178. host_riov,
  179. ARRAY_SIZE(host_riov));
  180. vringh_iov_init(&wiov,
  181. host_wiov,
  182. ARRAY_SIZE(host_wiov));
  183. err = vringh_getdesc_user(&vrh, &riov, &wiov,
  184. getrange, &head);
  185. }
  186. if (err == 0) {
  187. err = vringh_need_notify_user(&vrh);
  188. if (err < 0)
  189. errx(1, "vringh_need_notify_user: %i",
  190. err);
  191. if (err) {
  192. write(to_guest[1], "", 1);
  193. notifies++;
  194. }
  195. if (!vringh_notify_enable_user(&vrh))
  196. continue;
  197. /* Swallow all notifies at once. */
  198. if (read(to_host[0], buf, sizeof(buf)) < 1)
  199. break;
  200. vringh_notify_disable_user(&vrh);
  201. receives++;
  202. continue;
  203. }
  204. if (err != 1)
  205. errx(1, "vringh_getdesc_user: %i", err);
  206. /* We simply copy bytes. */
  207. if (riov.used) {
  208. rlen = vringh_iov_pull_user(&riov, rbuf,
  209. sizeof(rbuf));
  210. if (rlen != 4)
  211. errx(1, "vringh_iov_pull_user: %i",
  212. rlen);
  213. assert(riov.i == riov.used);
  214. written = 0;
  215. } else {
  216. err = vringh_iov_push_user(&wiov, rbuf, rlen);
  217. if (err != rlen)
  218. errx(1, "vringh_iov_push_user: %i",
  219. err);
  220. assert(wiov.i == wiov.used);
  221. written = err;
  222. }
  223. complete:
  224. xfers++;
  225. err = vringh_complete_user(&vrh, head, written);
  226. if (err != 0)
  227. errx(1, "vringh_complete_user: %i", err);
  228. }
  229. err = vringh_need_notify_user(&vrh);
  230. if (err < 0)
  231. errx(1, "vringh_need_notify_user: %i", err);
  232. if (err) {
  233. write(to_guest[1], "", 1);
  234. notifies++;
  235. }
  236. wait(&status);
  237. if (!WIFEXITED(status))
  238. errx(1, "Child died with signal %i?", WTERMSIG(status));
  239. if (WEXITSTATUS(status) != 0)
  240. errx(1, "Child exited %i?", WEXITSTATUS(status));
  241. printf("Host: notified %lu, pinged %lu\n", notifies, receives);
  242. return 0;
  243. } else {
  244. struct guest_virtio_device gvdev;
  245. struct virtqueue *vq;
  246. unsigned int *data;
  247. struct vring_desc *indirects;
  248. unsigned int finished = 0;
  249. /* We pass sg[]s pointing into here, but we need RINGSIZE+1 */
  250. data = guest_map + vring_size(RINGSIZE, ALIGN);
  251. indirects = (void *)data + (RINGSIZE + 1) * 2 * sizeof(int);
  252. /* We are the guest. */
  253. munmap(host_map, mapsize);
  254. close(to_guest[1]);
  255. close(to_host[0]);
  256. gvdev.vdev.features[0] = features;
  257. gvdev.to_host_fd = to_host[1];
  258. gvdev.notifies = 0;
  259. CPU_SET(first_cpu, &cpu_set);
  260. if (sched_setaffinity(getpid(), sizeof(cpu_set), &cpu_set))
  261. err(1, "Could not set affinity to cpu %u", first_cpu);
  262. vq = vring_new_virtqueue(0, RINGSIZE, ALIGN, &gvdev.vdev, true,
  263. guest_map, fast_vringh ? no_notify_host
  264. : parallel_notify_host,
  265. never_callback_guest, "guest vq");
  266. /* Don't kfree indirects. */
  267. __kfree_ignore_start = indirects;
  268. __kfree_ignore_end = indirects + RINGSIZE * 6;
  269. while (xfers < NUM_XFERS) {
  270. struct scatterlist sg[4];
  271. unsigned int num_sg, len;
  272. int *dbuf, err;
  273. bool output = !(xfers % 2);
  274. /* Consume bufs. */
  275. while ((dbuf = virtqueue_get_buf(vq, &len)) != NULL) {
  276. if (len == 4)
  277. assert(*dbuf == finished - 1);
  278. else if (!fast_vringh)
  279. assert(*dbuf == finished);
  280. finished++;
  281. }
  282. /* Produce a buffer. */
  283. dbuf = data + (xfers % (RINGSIZE + 1));
  284. if (output)
  285. *dbuf = xfers;
  286. else
  287. *dbuf = -1;
  288. switch ((xfers / sizeof(*dbuf)) % 4) {
  289. case 0:
  290. /* Nasty three-element sg list. */
  291. sg_init_table(sg, num_sg = 3);
  292. sg_set_buf(&sg[0], (void *)dbuf, 1);
  293. sg_set_buf(&sg[1], (void *)dbuf + 1, 2);
  294. sg_set_buf(&sg[2], (void *)dbuf + 3, 1);
  295. break;
  296. case 1:
  297. sg_init_table(sg, num_sg = 2);
  298. sg_set_buf(&sg[0], (void *)dbuf, 1);
  299. sg_set_buf(&sg[1], (void *)dbuf + 1, 3);
  300. break;
  301. case 2:
  302. sg_init_table(sg, num_sg = 1);
  303. sg_set_buf(&sg[0], (void *)dbuf, 4);
  304. break;
  305. case 3:
  306. sg_init_table(sg, num_sg = 4);
  307. sg_set_buf(&sg[0], (void *)dbuf, 1);
  308. sg_set_buf(&sg[1], (void *)dbuf + 1, 1);
  309. sg_set_buf(&sg[2], (void *)dbuf + 2, 1);
  310. sg_set_buf(&sg[3], (void *)dbuf + 3, 1);
  311. break;
  312. }
  313. /* May allocate an indirect, so force it to allocate
  314. * user addr */
  315. __kmalloc_fake = indirects + (xfers % RINGSIZE) * 4;
  316. if (output)
  317. err = virtqueue_add_outbuf(vq, sg, num_sg, dbuf,
  318. GFP_KERNEL);
  319. else
  320. err = virtqueue_add_inbuf(vq, sg, num_sg,
  321. dbuf, GFP_KERNEL);
  322. if (err == -ENOSPC) {
  323. if (!virtqueue_enable_cb_delayed(vq))
  324. continue;
  325. /* Swallow all notifies at once. */
  326. if (read(to_guest[0], buf, sizeof(buf)) < 1)
  327. break;
  328. receives++;
  329. virtqueue_disable_cb(vq);
  330. continue;
  331. }
  332. if (err)
  333. errx(1, "virtqueue_add_in/outbuf: %i", err);
  334. xfers++;
  335. virtqueue_kick(vq);
  336. }
  337. /* Any extra? */
  338. while (finished != xfers) {
  339. int *dbuf;
  340. unsigned int len;
  341. /* Consume bufs. */
  342. dbuf = virtqueue_get_buf(vq, &len);
  343. if (dbuf) {
  344. if (len == 4)
  345. assert(*dbuf == finished - 1);
  346. else
  347. assert(len == 0);
  348. finished++;
  349. continue;
  350. }
  351. if (!virtqueue_enable_cb_delayed(vq))
  352. continue;
  353. if (read(to_guest[0], buf, sizeof(buf)) < 1)
  354. break;
  355. receives++;
  356. virtqueue_disable_cb(vq);
  357. }
  358. printf("Guest: notified %lu, pinged %lu\n",
  359. gvdev.notifies, receives);
  360. vring_del_virtqueue(vq);
  361. return 0;
  362. }
  363. }
  364. int main(int argc, char *argv[])
  365. {
  366. struct virtio_device vdev;
  367. struct virtqueue *vq;
  368. struct vringh vrh;
  369. struct scatterlist guest_sg[RINGSIZE], *sgs[2];
  370. struct iovec host_riov[2], host_wiov[2];
  371. struct vringh_iov riov, wiov;
  372. struct vring_used_elem used[RINGSIZE];
  373. char buf[28];
  374. u16 head;
  375. int err;
  376. unsigned i;
  377. void *ret;
  378. bool (*getrange)(struct vringh *vrh, u64 addr, struct vringh_range *r);
  379. bool fast_vringh = false, parallel = false;
  380. getrange = getrange_iov;
  381. vdev.features[0] = 0;
  382. while (argv[1]) {
  383. if (strcmp(argv[1], "--indirect") == 0)
  384. vdev.features[0] |= (1 << VIRTIO_RING_F_INDIRECT_DESC);
  385. else if (strcmp(argv[1], "--eventidx") == 0)
  386. vdev.features[0] |= (1 << VIRTIO_RING_F_EVENT_IDX);
  387. else if (strcmp(argv[1], "--slow-range") == 0)
  388. getrange = getrange_slow;
  389. else if (strcmp(argv[1], "--fast-vringh") == 0)
  390. fast_vringh = true;
  391. else if (strcmp(argv[1], "--parallel") == 0)
  392. parallel = true;
  393. else
  394. errx(1, "Unknown arg %s", argv[1]);
  395. argv++;
  396. }
  397. if (parallel)
  398. return parallel_test(vdev.features[0], getrange, fast_vringh);
  399. if (posix_memalign(&__user_addr_min, PAGE_SIZE, USER_MEM) != 0)
  400. abort();
  401. __user_addr_max = __user_addr_min + USER_MEM;
  402. memset(__user_addr_min, 0, vring_size(RINGSIZE, ALIGN));
  403. /* Set up guest side. */
  404. vq = vring_new_virtqueue(0, RINGSIZE, ALIGN, &vdev, true,
  405. __user_addr_min,
  406. never_notify_host, never_callback_guest,
  407. "guest vq");
  408. /* Set up host side. */
  409. vring_init(&vrh.vring, RINGSIZE, __user_addr_min, ALIGN);
  410. vringh_init_user(&vrh, vdev.features[0], RINGSIZE, true,
  411. vrh.vring.desc, vrh.vring.avail, vrh.vring.used);
  412. /* No descriptor to get yet... */
  413. err = vringh_getdesc_user(&vrh, &riov, &wiov, getrange, &head);
  414. if (err != 0)
  415. errx(1, "vringh_getdesc_user: %i", err);
  416. /* Guest puts in a descriptor. */
  417. memcpy(__user_addr_max - 1, "a", 1);
  418. sg_init_table(guest_sg, 1);
  419. sg_set_buf(&guest_sg[0], __user_addr_max - 1, 1);
  420. sg_init_table(guest_sg+1, 1);
  421. sg_set_buf(&guest_sg[1], __user_addr_max - 3, 2);
  422. sgs[0] = &guest_sg[0];
  423. sgs[1] = &guest_sg[1];
  424. /* May allocate an indirect, so force it to allocate user addr */
  425. __kmalloc_fake = __user_addr_min + vring_size(RINGSIZE, ALIGN);
  426. err = virtqueue_add_sgs(vq, sgs, 1, 1, &err, GFP_KERNEL);
  427. if (err)
  428. errx(1, "virtqueue_add_sgs: %i", err);
  429. __kmalloc_fake = NULL;
  430. /* Host retreives it. */
  431. vringh_iov_init(&riov, host_riov, ARRAY_SIZE(host_riov));
  432. vringh_iov_init(&wiov, host_wiov, ARRAY_SIZE(host_wiov));
  433. err = vringh_getdesc_user(&vrh, &riov, &wiov, getrange, &head);
  434. if (err != 1)
  435. errx(1, "vringh_getdesc_user: %i", err);
  436. assert(riov.used == 1);
  437. assert(riov.iov[0].iov_base == __user_addr_max - 1);
  438. assert(riov.iov[0].iov_len == 1);
  439. if (getrange != getrange_slow) {
  440. assert(wiov.used == 1);
  441. assert(wiov.iov[0].iov_base == __user_addr_max - 3);
  442. assert(wiov.iov[0].iov_len == 2);
  443. } else {
  444. assert(wiov.used == 2);
  445. assert(wiov.iov[0].iov_base == __user_addr_max - 3);
  446. assert(wiov.iov[0].iov_len == 1);
  447. assert(wiov.iov[1].iov_base == __user_addr_max - 2);
  448. assert(wiov.iov[1].iov_len == 1);
  449. }
  450. err = vringh_iov_pull_user(&riov, buf, 5);
  451. if (err != 1)
  452. errx(1, "vringh_iov_pull_user: %i", err);
  453. assert(buf[0] == 'a');
  454. assert(riov.i == 1);
  455. assert(vringh_iov_pull_user(&riov, buf, 5) == 0);
  456. memcpy(buf, "bcdef", 5);
  457. err = vringh_iov_push_user(&wiov, buf, 5);
  458. if (err != 2)
  459. errx(1, "vringh_iov_push_user: %i", err);
  460. assert(memcmp(__user_addr_max - 3, "bc", 2) == 0);
  461. assert(wiov.i == wiov.used);
  462. assert(vringh_iov_push_user(&wiov, buf, 5) == 0);
  463. /* Host is done. */
  464. err = vringh_complete_user(&vrh, head, err);
  465. if (err != 0)
  466. errx(1, "vringh_complete_user: %i", err);
  467. /* Guest should see used token now. */
  468. __kfree_ignore_start = __user_addr_min + vring_size(RINGSIZE, ALIGN);
  469. __kfree_ignore_end = __kfree_ignore_start + 1;
  470. ret = virtqueue_get_buf(vq, &i);
  471. if (ret != &err)
  472. errx(1, "virtqueue_get_buf: %p", ret);
  473. assert(i == 2);
  474. /* Guest puts in a huge descriptor. */
  475. sg_init_table(guest_sg, RINGSIZE);
  476. for (i = 0; i < RINGSIZE; i++) {
  477. sg_set_buf(&guest_sg[i],
  478. __user_addr_max - USER_MEM/4, USER_MEM/4);
  479. }
  480. /* Fill contents with recognisable garbage. */
  481. for (i = 0; i < USER_MEM/4; i++)
  482. ((char *)__user_addr_max - USER_MEM/4)[i] = i;
  483. /* This will allocate an indirect, so force it to allocate user addr */
  484. __kmalloc_fake = __user_addr_min + vring_size(RINGSIZE, ALIGN);
  485. err = virtqueue_add_outbuf(vq, guest_sg, RINGSIZE, &err, GFP_KERNEL);
  486. if (err)
  487. errx(1, "virtqueue_add_outbuf (large): %i", err);
  488. __kmalloc_fake = NULL;
  489. /* Host picks it up (allocates new iov). */
  490. vringh_iov_init(&riov, host_riov, ARRAY_SIZE(host_riov));
  491. vringh_iov_init(&wiov, host_wiov, ARRAY_SIZE(host_wiov));
  492. err = vringh_getdesc_user(&vrh, &riov, &wiov, getrange, &head);
  493. if (err != 1)
  494. errx(1, "vringh_getdesc_user: %i", err);
  495. assert(riov.max_num & VRINGH_IOV_ALLOCATED);
  496. assert(riov.iov != host_riov);
  497. if (getrange != getrange_slow)
  498. assert(riov.used == RINGSIZE);
  499. else
  500. assert(riov.used == RINGSIZE * USER_MEM/4);
  501. assert(!(wiov.max_num & VRINGH_IOV_ALLOCATED));
  502. assert(wiov.used == 0);
  503. /* Pull data back out (in odd chunks), should be as expected. */
  504. for (i = 0; i < RINGSIZE * USER_MEM/4; i += 3) {
  505. err = vringh_iov_pull_user(&riov, buf, 3);
  506. if (err != 3 && i + err != RINGSIZE * USER_MEM/4)
  507. errx(1, "vringh_iov_pull_user large: %i", err);
  508. assert(buf[0] == (char)i);
  509. assert(err < 2 || buf[1] == (char)(i + 1));
  510. assert(err < 3 || buf[2] == (char)(i + 2));
  511. }
  512. assert(riov.i == riov.used);
  513. vringh_iov_cleanup(&riov);
  514. vringh_iov_cleanup(&wiov);
  515. /* Complete using multi interface, just because we can. */
  516. used[0].id = head;
  517. used[0].len = 0;
  518. err = vringh_complete_multi_user(&vrh, used, 1);
  519. if (err)
  520. errx(1, "vringh_complete_multi_user(1): %i", err);
  521. /* Free up those descriptors. */
  522. ret = virtqueue_get_buf(vq, &i);
  523. if (ret != &err)
  524. errx(1, "virtqueue_get_buf: %p", ret);
  525. /* Add lots of descriptors. */
  526. sg_init_table(guest_sg, 1);
  527. sg_set_buf(&guest_sg[0], __user_addr_max - 1, 1);
  528. for (i = 0; i < RINGSIZE; i++) {
  529. err = virtqueue_add_outbuf(vq, guest_sg, 1, &err, GFP_KERNEL);
  530. if (err)
  531. errx(1, "virtqueue_add_outbuf (multiple): %i", err);
  532. }
  533. /* Now get many, and consume them all at once. */
  534. vringh_iov_init(&riov, host_riov, ARRAY_SIZE(host_riov));
  535. vringh_iov_init(&wiov, host_wiov, ARRAY_SIZE(host_wiov));
  536. for (i = 0; i < RINGSIZE; i++) {
  537. err = vringh_getdesc_user(&vrh, &riov, &wiov, getrange, &head);
  538. if (err != 1)
  539. errx(1, "vringh_getdesc_user: %i", err);
  540. used[i].id = head;
  541. used[i].len = 0;
  542. }
  543. /* Make sure it wraps around ring, to test! */
  544. assert(vrh.vring.used->idx % RINGSIZE != 0);
  545. err = vringh_complete_multi_user(&vrh, used, RINGSIZE);
  546. if (err)
  547. errx(1, "vringh_complete_multi_user: %i", err);
  548. /* Free those buffers. */
  549. for (i = 0; i < RINGSIZE; i++) {
  550. unsigned len;
  551. assert(virtqueue_get_buf(vq, &len) != NULL);
  552. }
  553. /* Test weird (but legal!) indirect. */
  554. if (vdev.features[0] & (1 << VIRTIO_RING_F_INDIRECT_DESC)) {
  555. char *data = __user_addr_max - USER_MEM/4;
  556. struct vring_desc *d = __user_addr_max - USER_MEM/2;
  557. struct vring vring;
  558. /* Force creation of direct, which we modify. */
  559. vdev.features[0] &= ~(1 << VIRTIO_RING_F_INDIRECT_DESC);
  560. vq = vring_new_virtqueue(0, RINGSIZE, ALIGN, &vdev, true,
  561. __user_addr_min,
  562. never_notify_host,
  563. never_callback_guest,
  564. "guest vq");
  565. sg_init_table(guest_sg, 4);
  566. sg_set_buf(&guest_sg[0], d, sizeof(*d)*2);
  567. sg_set_buf(&guest_sg[1], d + 2, sizeof(*d)*1);
  568. sg_set_buf(&guest_sg[2], data + 6, 4);
  569. sg_set_buf(&guest_sg[3], d + 3, sizeof(*d)*3);
  570. err = virtqueue_add_outbuf(vq, guest_sg, 4, &err, GFP_KERNEL);
  571. if (err)
  572. errx(1, "virtqueue_add_outbuf (indirect): %i", err);
  573. vring_init(&vring, RINGSIZE, __user_addr_min, ALIGN);
  574. /* They're used in order, but double-check... */
  575. assert(vring.desc[0].addr == (unsigned long)d);
  576. assert(vring.desc[1].addr == (unsigned long)(d+2));
  577. assert(vring.desc[2].addr == (unsigned long)data + 6);
  578. assert(vring.desc[3].addr == (unsigned long)(d+3));
  579. vring.desc[0].flags |= VRING_DESC_F_INDIRECT;
  580. vring.desc[1].flags |= VRING_DESC_F_INDIRECT;
  581. vring.desc[3].flags |= VRING_DESC_F_INDIRECT;
  582. /* First indirect */
  583. d[0].addr = (unsigned long)data;
  584. d[0].len = 1;
  585. d[0].flags = VRING_DESC_F_NEXT;
  586. d[0].next = 1;
  587. d[1].addr = (unsigned long)data + 1;
  588. d[1].len = 2;
  589. d[1].flags = 0;
  590. /* Second indirect */
  591. d[2].addr = (unsigned long)data + 3;
  592. d[2].len = 3;
  593. d[2].flags = 0;
  594. /* Third indirect */
  595. d[3].addr = (unsigned long)data + 10;
  596. d[3].len = 5;
  597. d[3].flags = VRING_DESC_F_NEXT;
  598. d[3].next = 1;
  599. d[4].addr = (unsigned long)data + 15;
  600. d[4].len = 6;
  601. d[4].flags = VRING_DESC_F_NEXT;
  602. d[4].next = 2;
  603. d[5].addr = (unsigned long)data + 21;
  604. d[5].len = 7;
  605. d[5].flags = 0;
  606. /* Host picks it up (allocates new iov). */
  607. vringh_iov_init(&riov, host_riov, ARRAY_SIZE(host_riov));
  608. vringh_iov_init(&wiov, host_wiov, ARRAY_SIZE(host_wiov));
  609. err = vringh_getdesc_user(&vrh, &riov, &wiov, getrange, &head);
  610. if (err != 1)
  611. errx(1, "vringh_getdesc_user: %i", err);
  612. if (head != 0)
  613. errx(1, "vringh_getdesc_user: head %i not 0", head);
  614. assert(riov.max_num & VRINGH_IOV_ALLOCATED);
  615. if (getrange != getrange_slow)
  616. assert(riov.used == 7);
  617. else
  618. assert(riov.used == 28);
  619. err = vringh_iov_pull_user(&riov, buf, 29);
  620. assert(err == 28);
  621. /* Data should be linear. */
  622. for (i = 0; i < err; i++)
  623. assert(buf[i] == i);
  624. vringh_iov_cleanup(&riov);
  625. }
  626. /* Don't leak memory... */
  627. vring_del_virtqueue(vq);
  628. free(__user_addr_min);
  629. return 0;
  630. }