vringh_test.c 20 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746
  1. /* Simple test of virtio code, entirely in userspace. */
  2. #define _GNU_SOURCE
  3. #include <sched.h>
  4. #include <err.h>
  5. #include <linux/kernel.h>
  6. #include <linux/err.h>
  7. #include <linux/virtio.h>
  8. #include <linux/vringh.h>
  9. #include <linux/virtio_ring.h>
  10. #include <linux/uaccess.h>
  11. #include <sys/types.h>
  12. #include <sys/stat.h>
  13. #include <sys/mman.h>
  14. #include <sys/wait.h>
  15. #include <fcntl.h>
  16. #define USER_MEM (1024*1024)
  17. void *__user_addr_min, *__user_addr_max;
  18. void *__kmalloc_fake, *__kfree_ignore_start, *__kfree_ignore_end;
  19. static u64 user_addr_offset;
  20. #define RINGSIZE 256
  21. #define ALIGN 4096
  /*
   * Notify hook for the virtqueues created in main(), which never kicks
   * the host. Reaching this function is a test failure, so it aborts.
   */
  static bool never_notify_host(struct virtqueue *vq)
  {
      (void)vq;
      abort();
  }
  /*
   * Callback hook passed to every vring_new_virtqueue() call in this file.
   * It is not expected to run; if it does, the test aborts.
   */
  static void never_callback_guest(struct virtqueue *vq)
  {
      (void)vq;
      abort();
  }
  30. static bool getrange_iov(struct vringh *vrh, u64 addr, struct vringh_range *r)
  31. {
  32. if (addr < (u64)(unsigned long)__user_addr_min - user_addr_offset)
  33. return false;
  34. if (addr >= (u64)(unsigned long)__user_addr_max - user_addr_offset)
  35. return false;
  36. r->start = (u64)(unsigned long)__user_addr_min - user_addr_offset;
  37. r->end_incl = (u64)(unsigned long)__user_addr_max - 1 - user_addr_offset;
  38. r->offset = user_addr_offset;
  39. return true;
  40. }
  41. /* We return single byte ranges. */
  42. static bool getrange_slow(struct vringh *vrh, u64 addr, struct vringh_range *r)
  43. {
  44. if (addr < (u64)(unsigned long)__user_addr_min - user_addr_offset)
  45. return false;
  46. if (addr >= (u64)(unsigned long)__user_addr_max - user_addr_offset)
  47. return false;
  48. r->start = addr;
  49. r->end_incl = r->start;
  50. r->offset = user_addr_offset;
  51. return true;
  52. }
  53. struct guest_virtio_device {
  54. struct virtio_device vdev;
  55. int to_host_fd;
  56. unsigned long notifies;
  57. };
  58. static bool parallel_notify_host(struct virtqueue *vq)
  59. {
  60. int rc;
  61. struct guest_virtio_device *gvdev;
  62. gvdev = container_of(vq->vdev, struct guest_virtio_device, vdev);
  63. rc = write(gvdev->to_host_fd, "", 1);
  64. if (rc < 0)
  65. return false;
  66. gvdev->notifies++;
  67. return true;
  68. }
  /*
   * Notify hook used when parallel_test() runs with fast_vringh set: does
   * nothing and reports success.
   */
  static bool no_notify_host(struct virtqueue *vq)
  {
      (void)vq;
      return true;
  }
  /* Number of buffers each side of parallel_test() pushes through the ring. */
  #define NUM_XFERS (10 * 1000 * 1000)
  /*
   * We aim for two "distant" cpus: report the lowest and highest CPU
   * numbers this process is able to pin itself to.
   *
   * @first: receives the lowest usable CPU, or -1U if none was usable.
   * @last:  receives the highest usable CPU, or 0 if none was usable.
   *
   * Side effect: every successful probe changes the affinity of the
   * calling process, so on return it is pinned to the last CPU that was
   * accepted. Callers are expected to set the affinity they want afterwards.
   */
  static void find_cpus(unsigned int *first, unsigned int *last)
  {
      unsigned int cpu;

      *first = -1U;
      *last = 0;

      /*
       * A cpu_set_t only has room for CPU_SETSIZE CPUs; probing beyond
       * that can never succeed, so stop there instead of at a magic number.
       */
      for (cpu = 0; cpu < (unsigned int)CPU_SETSIZE; cpu++) {
          cpu_set_t set;

          CPU_ZERO(&set);
          CPU_SET(cpu, &set);
          if (sched_setaffinity(getpid(), sizeof(set), &set) != 0)
              continue;

          if (cpu < *first)
              *first = cpu;
          if (cpu > *last)
              *last = cpu;
      }
  }
  92. /* Opencoded version for fast mode */
  93. static inline int vringh_get_head(struct vringh *vrh, u16 *head)
  94. {
  95. u16 avail_idx, i;
  96. int err;
  97. err = get_user(avail_idx, &vrh->vring.avail->idx);
  98. if (err)
  99. return err;
  100. if (vrh->last_avail_idx == avail_idx)
  101. return 0;
  102. /* Only get avail ring entries after they have been exposed by guest. */
  103. virtio_rmb(vrh->weak_barriers);
  104. i = vrh->last_avail_idx & (vrh->vring.num - 1);
  105. err = get_user(*head, &vrh->vring.avail->ring[i]);
  106. if (err)
  107. return err;
  108. vrh->last_avail_idx++;
  109. return 1;
  110. }
  111. static int parallel_test(unsigned long features,
  112. bool (*getrange)(struct vringh *vrh,
  113. u64 addr, struct vringh_range *r),
  114. bool fast_vringh)
  115. {
  116. void *host_map, *guest_map;
  117. int fd, mapsize, to_guest[2], to_host[2];
  118. unsigned long xfers = 0, notifies = 0, receives = 0;
  119. unsigned int first_cpu, last_cpu;
  120. cpu_set_t cpu_set;
  121. char buf[128];
  122. /* Create real file to mmap. */
  123. fd = open("/tmp/vringh_test-file", O_RDWR|O_CREAT|O_TRUNC, 0600);
  124. if (fd < 0)
  125. err(1, "Opening /tmp/vringh_test-file");
  126. /* Extra room at the end for some data, and indirects */
  127. mapsize = vring_size(RINGSIZE, ALIGN)
  128. + RINGSIZE * 2 * sizeof(int)
  129. + RINGSIZE * 6 * sizeof(struct vring_desc);
  130. mapsize = (mapsize + getpagesize() - 1) & ~(getpagesize() - 1);
  131. ftruncate(fd, mapsize);
  132. /* Parent and child use separate addresses, to check our mapping logic! */
  133. host_map = mmap(NULL, mapsize, PROT_READ|PROT_WRITE, MAP_SHARED, fd, 0);
  134. guest_map = mmap(NULL, mapsize, PROT_READ|PROT_WRITE, MAP_SHARED, fd, 0);
  135. pipe(to_guest);
  136. pipe(to_host);
  137. CPU_ZERO(&cpu_set);
  138. find_cpus(&first_cpu, &last_cpu);
  139. printf("Using CPUS %u and %u\n", first_cpu, last_cpu);
  140. fflush(stdout);
  141. if (fork() != 0) {
  142. struct vringh vrh;
  143. int status, err, rlen = 0;
  144. char rbuf[5];
  145. /* We are the host: never access guest addresses! */
  146. munmap(guest_map, mapsize);
  147. __user_addr_min = host_map;
  148. __user_addr_max = __user_addr_min + mapsize;
  149. user_addr_offset = host_map - guest_map;
  150. assert(user_addr_offset);
  151. close(to_guest[0]);
  152. close(to_host[1]);
  153. vring_init(&vrh.vring, RINGSIZE, host_map, ALIGN);
  154. vringh_init_user(&vrh, features, RINGSIZE, true,
  155. vrh.vring.desc, vrh.vring.avail, vrh.vring.used);
  156. CPU_SET(first_cpu, &cpu_set);
  157. if (sched_setaffinity(getpid(), sizeof(cpu_set), &cpu_set))
  158. errx(1, "Could not set affinity to cpu %u", first_cpu);
  159. while (xfers < NUM_XFERS) {
  160. struct iovec host_riov[2], host_wiov[2];
  161. struct vringh_iov riov, wiov;
  162. u16 head, written;
  163. if (fast_vringh) {
  164. for (;;) {
  165. err = vringh_get_head(&vrh, &head);
  166. if (err != 0)
  167. break;
  168. err = vringh_need_notify_user(&vrh);
  169. if (err < 0)
  170. errx(1, "vringh_need_notify_user: %i",
  171. err);
  172. if (err) {
  173. write(to_guest[1], "", 1);
  174. notifies++;
  175. }
  176. }
  177. if (err != 1)
  178. errx(1, "vringh_get_head");
  179. written = 0;
  180. goto complete;
  181. } else {
  182. vringh_iov_init(&riov,
  183. host_riov,
  184. ARRAY_SIZE(host_riov));
  185. vringh_iov_init(&wiov,
  186. host_wiov,
  187. ARRAY_SIZE(host_wiov));
  188. err = vringh_getdesc_user(&vrh, &riov, &wiov,
  189. getrange, &head);
  190. }
  191. if (err == 0) {
  192. err = vringh_need_notify_user(&vrh);
  193. if (err < 0)
  194. errx(1, "vringh_need_notify_user: %i",
  195. err);
  196. if (err) {
  197. write(to_guest[1], "", 1);
  198. notifies++;
  199. }
  200. if (!vringh_notify_enable_user(&vrh))
  201. continue;
  202. /* Swallow all notifies at once. */
  203. if (read(to_host[0], buf, sizeof(buf)) < 1)
  204. break;
  205. vringh_notify_disable_user(&vrh);
  206. receives++;
  207. continue;
  208. }
  209. if (err != 1)
  210. errx(1, "vringh_getdesc_user: %i", err);
  211. /* We simply copy bytes. */
  212. if (riov.used) {
  213. rlen = vringh_iov_pull_user(&riov, rbuf,
  214. sizeof(rbuf));
  215. if (rlen != 4)
  216. errx(1, "vringh_iov_pull_user: %i",
  217. rlen);
  218. assert(riov.i == riov.used);
  219. written = 0;
  220. } else {
  221. err = vringh_iov_push_user(&wiov, rbuf, rlen);
  222. if (err != rlen)
  223. errx(1, "vringh_iov_push_user: %i",
  224. err);
  225. assert(wiov.i == wiov.used);
  226. written = err;
  227. }
  228. complete:
  229. xfers++;
  230. err = vringh_complete_user(&vrh, head, written);
  231. if (err != 0)
  232. errx(1, "vringh_complete_user: %i", err);
  233. }
  234. err = vringh_need_notify_user(&vrh);
  235. if (err < 0)
  236. errx(1, "vringh_need_notify_user: %i", err);
  237. if (err) {
  238. write(to_guest[1], "", 1);
  239. notifies++;
  240. }
  241. wait(&status);
  242. if (!WIFEXITED(status))
  243. errx(1, "Child died with signal %i?", WTERMSIG(status));
  244. if (WEXITSTATUS(status) != 0)
  245. errx(1, "Child exited %i?", WEXITSTATUS(status));
  246. printf("Host: notified %lu, pinged %lu\n", notifies, receives);
  247. return 0;
  248. } else {
  249. struct guest_virtio_device gvdev;
  250. struct virtqueue *vq;
  251. unsigned int *data;
  252. struct vring_desc *indirects;
  253. unsigned int finished = 0;
  254. /* We pass sg[]s pointing into here, but we need RINGSIZE+1 */
  255. data = guest_map + vring_size(RINGSIZE, ALIGN);
  256. indirects = (void *)data + (RINGSIZE + 1) * 2 * sizeof(int);
  257. /* We are the guest. */
  258. munmap(host_map, mapsize);
  259. close(to_guest[1]);
  260. close(to_host[0]);
  261. gvdev.vdev.features[0] = features;
  262. gvdev.to_host_fd = to_host[1];
  263. gvdev.notifies = 0;
  264. CPU_SET(first_cpu, &cpu_set);
  265. if (sched_setaffinity(getpid(), sizeof(cpu_set), &cpu_set))
  266. err(1, "Could not set affinity to cpu %u", first_cpu);
  267. vq = vring_new_virtqueue(0, RINGSIZE, ALIGN, &gvdev.vdev, true,
  268. guest_map, fast_vringh ? no_notify_host
  269. : parallel_notify_host,
  270. never_callback_guest, "guest vq");
  271. /* Don't kfree indirects. */
  272. __kfree_ignore_start = indirects;
  273. __kfree_ignore_end = indirects + RINGSIZE * 6;
  274. while (xfers < NUM_XFERS) {
  275. struct scatterlist sg[4];
  276. unsigned int num_sg, len;
  277. int *dbuf, err;
  278. bool output = !(xfers % 2);
  279. /* Consume bufs. */
  280. while ((dbuf = virtqueue_get_buf(vq, &len)) != NULL) {
  281. if (len == 4)
  282. assert(*dbuf == finished - 1);
  283. else if (!fast_vringh)
  284. assert(*dbuf == finished);
  285. finished++;
  286. }
  287. /* Produce a buffer. */
  288. dbuf = data + (xfers % (RINGSIZE + 1));
  289. if (output)
  290. *dbuf = xfers;
  291. else
  292. *dbuf = -1;
  293. switch ((xfers / sizeof(*dbuf)) % 4) {
  294. case 0:
  295. /* Nasty three-element sg list. */
  296. sg_init_table(sg, num_sg = 3);
  297. sg_set_buf(&sg[0], (void *)dbuf, 1);
  298. sg_set_buf(&sg[1], (void *)dbuf + 1, 2);
  299. sg_set_buf(&sg[2], (void *)dbuf + 3, 1);
  300. break;
  301. case 1:
  302. sg_init_table(sg, num_sg = 2);
  303. sg_set_buf(&sg[0], (void *)dbuf, 1);
  304. sg_set_buf(&sg[1], (void *)dbuf + 1, 3);
  305. break;
  306. case 2:
  307. sg_init_table(sg, num_sg = 1);
  308. sg_set_buf(&sg[0], (void *)dbuf, 4);
  309. break;
  310. case 3:
  311. sg_init_table(sg, num_sg = 4);
  312. sg_set_buf(&sg[0], (void *)dbuf, 1);
  313. sg_set_buf(&sg[1], (void *)dbuf + 1, 1);
  314. sg_set_buf(&sg[2], (void *)dbuf + 2, 1);
  315. sg_set_buf(&sg[3], (void *)dbuf + 3, 1);
  316. break;
  317. }
  318. /* May allocate an indirect, so force it to allocate
  319. * user addr */
  320. __kmalloc_fake = indirects + (xfers % RINGSIZE) * 4;
  321. if (output)
  322. err = virtqueue_add_outbuf(vq, sg, num_sg, dbuf,
  323. GFP_KERNEL);
  324. else
  325. err = virtqueue_add_inbuf(vq, sg, num_sg,
  326. dbuf, GFP_KERNEL);
  327. if (err == -ENOSPC) {
  328. if (!virtqueue_enable_cb_delayed(vq))
  329. continue;
  330. /* Swallow all notifies at once. */
  331. if (read(to_guest[0], buf, sizeof(buf)) < 1)
  332. break;
  333. receives++;
  334. virtqueue_disable_cb(vq);
  335. continue;
  336. }
  337. if (err)
  338. errx(1, "virtqueue_add_in/outbuf: %i", err);
  339. xfers++;
  340. virtqueue_kick(vq);
  341. }
  342. /* Any extra? */
  343. while (finished != xfers) {
  344. int *dbuf;
  345. unsigned int len;
  346. /* Consume bufs. */
  347. dbuf = virtqueue_get_buf(vq, &len);
  348. if (dbuf) {
  349. if (len == 4)
  350. assert(*dbuf == finished - 1);
  351. else
  352. assert(len == 0);
  353. finished++;
  354. continue;
  355. }
  356. if (!virtqueue_enable_cb_delayed(vq))
  357. continue;
  358. if (read(to_guest[0], buf, sizeof(buf)) < 1)
  359. break;
  360. receives++;
  361. virtqueue_disable_cb(vq);
  362. }
  363. printf("Guest: notified %lu, pinged %lu\n",
  364. gvdev.notifies, receives);
  365. vring_del_virtqueue(vq);
  366. return 0;
  367. }
  368. }
  369. int main(int argc, char *argv[])
  370. {
  371. struct virtio_device vdev;
  372. struct virtqueue *vq;
  373. struct vringh vrh;
  374. struct scatterlist guest_sg[RINGSIZE], *sgs[2];
  375. struct iovec host_riov[2], host_wiov[2];
  376. struct vringh_iov riov, wiov;
  377. struct vring_used_elem used[RINGSIZE];
  378. char buf[28];
  379. u16 head;
  380. int err;
  381. unsigned i;
  382. void *ret;
  383. bool (*getrange)(struct vringh *vrh, u64 addr, struct vringh_range *r);
  384. bool fast_vringh = false, parallel = false;
  385. getrange = getrange_iov;
  386. vdev.features[0] = 0;
  387. while (argv[1]) {
  388. if (strcmp(argv[1], "--indirect") == 0)
  389. vdev.features[0] |= (1 << VIRTIO_RING_F_INDIRECT_DESC);
  390. else if (strcmp(argv[1], "--eventidx") == 0)
  391. vdev.features[0] |= (1 << VIRTIO_RING_F_EVENT_IDX);
  392. else if (strcmp(argv[1], "--slow-range") == 0)
  393. getrange = getrange_slow;
  394. else if (strcmp(argv[1], "--fast-vringh") == 0)
  395. fast_vringh = true;
  396. else if (strcmp(argv[1], "--parallel") == 0)
  397. parallel = true;
  398. else
  399. errx(1, "Unknown arg %s", argv[1]);
  400. argv++;
  401. }
  402. if (parallel)
  403. return parallel_test(vdev.features[0], getrange, fast_vringh);
  404. if (posix_memalign(&__user_addr_min, PAGE_SIZE, USER_MEM) != 0)
  405. abort();
  406. __user_addr_max = __user_addr_min + USER_MEM;
  407. memset(__user_addr_min, 0, vring_size(RINGSIZE, ALIGN));
  408. /* Set up guest side. */
  409. vq = vring_new_virtqueue(0, RINGSIZE, ALIGN, &vdev, true,
  410. __user_addr_min,
  411. never_notify_host, never_callback_guest,
  412. "guest vq");
  413. /* Set up host side. */
  414. vring_init(&vrh.vring, RINGSIZE, __user_addr_min, ALIGN);
  415. vringh_init_user(&vrh, vdev.features[0], RINGSIZE, true,
  416. vrh.vring.desc, vrh.vring.avail, vrh.vring.used);
  417. /* No descriptor to get yet... */
  418. err = vringh_getdesc_user(&vrh, &riov, &wiov, getrange, &head);
  419. if (err != 0)
  420. errx(1, "vringh_getdesc_user: %i", err);
  421. /* Guest puts in a descriptor. */
  422. memcpy(__user_addr_max - 1, "a", 1);
  423. sg_init_table(guest_sg, 1);
  424. sg_set_buf(&guest_sg[0], __user_addr_max - 1, 1);
  425. sg_init_table(guest_sg+1, 1);
  426. sg_set_buf(&guest_sg[1], __user_addr_max - 3, 2);
  427. sgs[0] = &guest_sg[0];
  428. sgs[1] = &guest_sg[1];
  429. /* May allocate an indirect, so force it to allocate user addr */
  430. __kmalloc_fake = __user_addr_min + vring_size(RINGSIZE, ALIGN);
  431. err = virtqueue_add_sgs(vq, sgs, 1, 1, &err, GFP_KERNEL);
  432. if (err)
  433. errx(1, "virtqueue_add_sgs: %i", err);
  434. __kmalloc_fake = NULL;
  435. /* Host retreives it. */
  436. vringh_iov_init(&riov, host_riov, ARRAY_SIZE(host_riov));
  437. vringh_iov_init(&wiov, host_wiov, ARRAY_SIZE(host_wiov));
  438. err = vringh_getdesc_user(&vrh, &riov, &wiov, getrange, &head);
  439. if (err != 1)
  440. errx(1, "vringh_getdesc_user: %i", err);
  441. assert(riov.used == 1);
  442. assert(riov.iov[0].iov_base == __user_addr_max - 1);
  443. assert(riov.iov[0].iov_len == 1);
  444. if (getrange != getrange_slow) {
  445. assert(wiov.used == 1);
  446. assert(wiov.iov[0].iov_base == __user_addr_max - 3);
  447. assert(wiov.iov[0].iov_len == 2);
  448. } else {
  449. assert(wiov.used == 2);
  450. assert(wiov.iov[0].iov_base == __user_addr_max - 3);
  451. assert(wiov.iov[0].iov_len == 1);
  452. assert(wiov.iov[1].iov_base == __user_addr_max - 2);
  453. assert(wiov.iov[1].iov_len == 1);
  454. }
  455. err = vringh_iov_pull_user(&riov, buf, 5);
  456. if (err != 1)
  457. errx(1, "vringh_iov_pull_user: %i", err);
  458. assert(buf[0] == 'a');
  459. assert(riov.i == 1);
  460. assert(vringh_iov_pull_user(&riov, buf, 5) == 0);
  461. memcpy(buf, "bcdef", 5);
  462. err = vringh_iov_push_user(&wiov, buf, 5);
  463. if (err != 2)
  464. errx(1, "vringh_iov_push_user: %i", err);
  465. assert(memcmp(__user_addr_max - 3, "bc", 2) == 0);
  466. assert(wiov.i == wiov.used);
  467. assert(vringh_iov_push_user(&wiov, buf, 5) == 0);
  468. /* Host is done. */
  469. err = vringh_complete_user(&vrh, head, err);
  470. if (err != 0)
  471. errx(1, "vringh_complete_user: %i", err);
  472. /* Guest should see used token now. */
  473. __kfree_ignore_start = __user_addr_min + vring_size(RINGSIZE, ALIGN);
  474. __kfree_ignore_end = __kfree_ignore_start + 1;
  475. ret = virtqueue_get_buf(vq, &i);
  476. if (ret != &err)
  477. errx(1, "virtqueue_get_buf: %p", ret);
  478. assert(i == 2);
  479. /* Guest puts in a huge descriptor. */
  480. sg_init_table(guest_sg, RINGSIZE);
  481. for (i = 0; i < RINGSIZE; i++) {
  482. sg_set_buf(&guest_sg[i],
  483. __user_addr_max - USER_MEM/4, USER_MEM/4);
  484. }
  485. /* Fill contents with recognisable garbage. */
  486. for (i = 0; i < USER_MEM/4; i++)
  487. ((char *)__user_addr_max - USER_MEM/4)[i] = i;
  488. /* This will allocate an indirect, so force it to allocate user addr */
  489. __kmalloc_fake = __user_addr_min + vring_size(RINGSIZE, ALIGN);
  490. err = virtqueue_add_outbuf(vq, guest_sg, RINGSIZE, &err, GFP_KERNEL);
  491. if (err)
  492. errx(1, "virtqueue_add_outbuf (large): %i", err);
  493. __kmalloc_fake = NULL;
  494. /* Host picks it up (allocates new iov). */
  495. vringh_iov_init(&riov, host_riov, ARRAY_SIZE(host_riov));
  496. vringh_iov_init(&wiov, host_wiov, ARRAY_SIZE(host_wiov));
  497. err = vringh_getdesc_user(&vrh, &riov, &wiov, getrange, &head);
  498. if (err != 1)
  499. errx(1, "vringh_getdesc_user: %i", err);
  500. assert(riov.max_num & VRINGH_IOV_ALLOCATED);
  501. assert(riov.iov != host_riov);
  502. if (getrange != getrange_slow)
  503. assert(riov.used == RINGSIZE);
  504. else
  505. assert(riov.used == RINGSIZE * USER_MEM/4);
  506. assert(!(wiov.max_num & VRINGH_IOV_ALLOCATED));
  507. assert(wiov.used == 0);
  508. /* Pull data back out (in odd chunks), should be as expected. */
  509. for (i = 0; i < RINGSIZE * USER_MEM/4; i += 3) {
  510. err = vringh_iov_pull_user(&riov, buf, 3);
  511. if (err != 3 && i + err != RINGSIZE * USER_MEM/4)
  512. errx(1, "vringh_iov_pull_user large: %i", err);
  513. assert(buf[0] == (char)i);
  514. assert(err < 2 || buf[1] == (char)(i + 1));
  515. assert(err < 3 || buf[2] == (char)(i + 2));
  516. }
  517. assert(riov.i == riov.used);
  518. vringh_iov_cleanup(&riov);
  519. vringh_iov_cleanup(&wiov);
  520. /* Complete using multi interface, just because we can. */
  521. used[0].id = head;
  522. used[0].len = 0;
  523. err = vringh_complete_multi_user(&vrh, used, 1);
  524. if (err)
  525. errx(1, "vringh_complete_multi_user(1): %i", err);
  526. /* Free up those descriptors. */
  527. ret = virtqueue_get_buf(vq, &i);
  528. if (ret != &err)
  529. errx(1, "virtqueue_get_buf: %p", ret);
  530. /* Add lots of descriptors. */
  531. sg_init_table(guest_sg, 1);
  532. sg_set_buf(&guest_sg[0], __user_addr_max - 1, 1);
  533. for (i = 0; i < RINGSIZE; i++) {
  534. err = virtqueue_add_outbuf(vq, guest_sg, 1, &err, GFP_KERNEL);
  535. if (err)
  536. errx(1, "virtqueue_add_outbuf (multiple): %i", err);
  537. }
  538. /* Now get many, and consume them all at once. */
  539. vringh_iov_init(&riov, host_riov, ARRAY_SIZE(host_riov));
  540. vringh_iov_init(&wiov, host_wiov, ARRAY_SIZE(host_wiov));
  541. for (i = 0; i < RINGSIZE; i++) {
  542. err = vringh_getdesc_user(&vrh, &riov, &wiov, getrange, &head);
  543. if (err != 1)
  544. errx(1, "vringh_getdesc_user: %i", err);
  545. used[i].id = head;
  546. used[i].len = 0;
  547. }
  548. /* Make sure it wraps around ring, to test! */
  549. assert(vrh.vring.used->idx % RINGSIZE != 0);
  550. err = vringh_complete_multi_user(&vrh, used, RINGSIZE);
  551. if (err)
  552. errx(1, "vringh_complete_multi_user: %i", err);
  553. /* Free those buffers. */
  554. for (i = 0; i < RINGSIZE; i++) {
  555. unsigned len;
  556. assert(virtqueue_get_buf(vq, &len) != NULL);
  557. }
  558. /* Test weird (but legal!) indirect. */
  559. if (vdev.features[0] & (1 << VIRTIO_RING_F_INDIRECT_DESC)) {
  560. char *data = __user_addr_max - USER_MEM/4;
  561. struct vring_desc *d = __user_addr_max - USER_MEM/2;
  562. struct vring vring;
  563. /* Force creation of direct, which we modify. */
  564. vdev.features[0] &= ~(1 << VIRTIO_RING_F_INDIRECT_DESC);
  565. vq = vring_new_virtqueue(0, RINGSIZE, ALIGN, &vdev, true,
  566. __user_addr_min,
  567. never_notify_host,
  568. never_callback_guest,
  569. "guest vq");
  570. sg_init_table(guest_sg, 4);
  571. sg_set_buf(&guest_sg[0], d, sizeof(*d)*2);
  572. sg_set_buf(&guest_sg[1], d + 2, sizeof(*d)*1);
  573. sg_set_buf(&guest_sg[2], data + 6, 4);
  574. sg_set_buf(&guest_sg[3], d + 3, sizeof(*d)*3);
  575. err = virtqueue_add_outbuf(vq, guest_sg, 4, &err, GFP_KERNEL);
  576. if (err)
  577. errx(1, "virtqueue_add_outbuf (indirect): %i", err);
  578. vring_init(&vring, RINGSIZE, __user_addr_min, ALIGN);
  579. /* They're used in order, but double-check... */
  580. assert(vring.desc[0].addr == (unsigned long)d);
  581. assert(vring.desc[1].addr == (unsigned long)(d+2));
  582. assert(vring.desc[2].addr == (unsigned long)data + 6);
  583. assert(vring.desc[3].addr == (unsigned long)(d+3));
  584. vring.desc[0].flags |= VRING_DESC_F_INDIRECT;
  585. vring.desc[1].flags |= VRING_DESC_F_INDIRECT;
  586. vring.desc[3].flags |= VRING_DESC_F_INDIRECT;
  587. /* First indirect */
  588. d[0].addr = (unsigned long)data;
  589. d[0].len = 1;
  590. d[0].flags = VRING_DESC_F_NEXT;
  591. d[0].next = 1;
  592. d[1].addr = (unsigned long)data + 1;
  593. d[1].len = 2;
  594. d[1].flags = 0;
  595. /* Second indirect */
  596. d[2].addr = (unsigned long)data + 3;
  597. d[2].len = 3;
  598. d[2].flags = 0;
  599. /* Third indirect */
  600. d[3].addr = (unsigned long)data + 10;
  601. d[3].len = 5;
  602. d[3].flags = VRING_DESC_F_NEXT;
  603. d[3].next = 1;
  604. d[4].addr = (unsigned long)data + 15;
  605. d[4].len = 6;
  606. d[4].flags = VRING_DESC_F_NEXT;
  607. d[4].next = 2;
  608. d[5].addr = (unsigned long)data + 21;
  609. d[5].len = 7;
  610. d[5].flags = 0;
  611. /* Host picks it up (allocates new iov). */
  612. vringh_iov_init(&riov, host_riov, ARRAY_SIZE(host_riov));
  613. vringh_iov_init(&wiov, host_wiov, ARRAY_SIZE(host_wiov));
  614. err = vringh_getdesc_user(&vrh, &riov, &wiov, getrange, &head);
  615. if (err != 1)
  616. errx(1, "vringh_getdesc_user: %i", err);
  617. if (head != 0)
  618. errx(1, "vringh_getdesc_user: head %i not 0", head);
  619. assert(riov.max_num & VRINGH_IOV_ALLOCATED);
  620. if (getrange != getrange_slow)
  621. assert(riov.used == 7);
  622. else
  623. assert(riov.used == 28);
  624. err = vringh_iov_pull_user(&riov, buf, 29);
  625. assert(err == 28);
  626. /* Data should be linear. */
  627. for (i = 0; i < err; i++)
  628. assert(buf[i] == i);
  629. vringh_iov_cleanup(&riov);
  630. }
  631. /* Don't leak memory... */
  632. vring_del_virtqueue(vq);
  633. free(__user_addr_min);
  634. return 0;
  635. }