rados.h 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481
  1. #ifndef CEPH_RADOS_H
  2. #define CEPH_RADOS_H
  3. /*
  4. * Data types for the Ceph distributed object storage layer RADOS
  5. * (Reliable Autonomic Distributed Object Store).
  6. */
  7. #include <linux/ceph/msgr.h>
  /*
   * osdmap encoding versions
   */
  #define CEPH_OSDMAP_INC_VERSION      5
  #define CEPH_OSDMAP_INC_VERSION_EXT  6
  #define CEPH_OSDMAP_VERSION          5
  #define CEPH_OSDMAP_VERSION_EXT      6
  /*
   * fs id
   */
  struct ceph_fsid {
      unsigned char fsid[16];
  };

  /*
   * Byte-wise comparison of two fsids.
   *
   * Returns the memcmp() result over the whole structure: zero when both
   * ids are identical, otherwise a negative or positive value according to
   * the first differing byte.  Neither pointer may be NULL.
   */
  static inline int ceph_fsid_compare(const struct ceph_fsid *a,
                                      const struct ceph_fsid *b)
  {
      return memcmp(a, b, sizeof(*a));
  }
  /*
   * ino, object, etc.
   */
  typedef __le64 ceph_snapid_t;

  /* special snapid values, taken from the top of the 64-bit range */
  #define CEPH_SNAPDIR ((__u64)(-1))  /* reserved for hidden .snap dir */
  #define CEPH_NOSNAP  ((__u64)(-2))  /* "head", "live" revision */
  #define CEPH_MAXSNAP ((__u64)(-3))  /* largest valid snapid */
  /*
   * Packed timestamp: two little-endian 32-bit fields (seconds, then
   * nanoseconds), 8 bytes in total.
   */
  struct ceph_timespec {
      __le32 tv_sec;
      __le32 tv_nsec;
  } __attribute__ ((packed));
  /*
   * object layout - how objects are mapped into PGs
   */
  #define CEPH_OBJECT_LAYOUT_HASH     1
  #define CEPH_OBJECT_LAYOUT_LINEAR   2
  #define CEPH_OBJECT_LAYOUT_HASHINO  3
  /*
   * pg layout -- how PGs are mapped onto (sets of) OSDs
   */
  #define CEPH_PG_LAYOUT_CRUSH   0
  #define CEPH_PG_LAYOUT_HASH    1
  #define CEPH_PG_LAYOUT_LINEAR  2
  #define CEPH_PG_LAYOUT_HYBRID  3

  #define CEPH_PG_MAX_SIZE       16  /* max # osds in a single pg */
  /*
   * placement group.
   * we encode this into one __le64.
   *
   * The three packed fields add up to exactly 8 bytes.
   */
  struct ceph_pg {
      __le16 preferred;  /* preferred primary osd */
      __le16 ps;         /* placement seed */
      __le32 pool;       /* object pool */
  } __attribute__ ((packed));
  /*
   * pg_pool is a set of pgs storing a pool of objects
   *
   * pg_num -- base number of pseudorandomly placed pgs
   *
   * pgp_num -- effective number when calculating pg placement. this
   * is used for pg_num increases. new pgs result in data being "split"
   * into new pgs. for this to proceed smoothly, new pgs are initially
   * colocated with their parents; that is, pgp_num doesn't increase
   * until the new pgs have successfully split. only _then_ are the new
   * pgs placed independently.
   *
   * lpg_num -- localized pg count (per device). replicas are randomly
   * selected.
   *
   * lpgp_num -- as above.
   */
  #define CEPH_NOPOOL  ((__u64) (-1))  /* pool id not defined */

  #define CEPH_PG_TYPE_REP     1
  #define CEPH_PG_TYPE_RAID4   2
  #define CEPH_PG_POOL_VERSION 2
  /*
   * Packed description of a pg pool.  Field order and widths define the
   * layout, so they must not be rearranged.
   */
  struct ceph_pg_pool {
      __u8 type;                 /* CEPH_PG_TYPE_* */
      __u8 size;                 /* number of osds in each pg */
      __u8 crush_ruleset;        /* crush placement rule */
      __u8 object_hash;          /* hash mapping object name to ps */
      __le32 pg_num;             /* number of pg's */
      __le32 pgp_num;            /* number of pg's used for placement */
      __le32 lpg_num;            /* number of localized pg's */
      __le32 lpgp_num;           /* localized counterpart of pgp_num */
      __le32 last_change;        /* most recent epoch changed */
      __le64 snap_seq;           /* seq for per-pool snapshot */
      __le32 snap_epoch;         /* epoch of last snap */
      __le32 num_snaps;
      __le32 num_removed_snap_intervals; /* if non-empty, NO per-pool snaps */
      __le64 auid;               /* who owns the pg */
  } __attribute__ ((packed));
  /*
   * stable_mod func is used to control number of placement groups.
   * similar to straight-up modulo, but produces a stable mapping as b
   * increases over time. b is the number of bins, and bmask is the
   * containing power of 2 minus 1.
   *
   * b <= bmask and bmask=(2**n)-1
   * e.g., b=12 -> bmask=15, b=123 -> bmask=127
   *
   * @x:     value to map
   * @b:     number of bins
   * @bmask: containing power of 2 minus 1
   *
   * Returns x & bmask when that value is below b; otherwise falls back to
   * the next smaller mask, x & (bmask >> 1).
   */
  static inline int ceph_stable_mod(int x, int b, int bmask)
  {
      if ((x & bmask) < b)
          return x & bmask;
      else
          return x & (bmask >> 1);
  }
  111. /*
  112. * object layout - how a given object should be stored.
  113. */
  114. struct ceph_object_layout {
  115. struct ceph_pg ol_pgid; /* raw pg, with _full_ ps precision. */
  116. __le32 ol_stripe_unit; /* for per-object parity, if any */
  117. } __attribute__ ((packed));
  /*
   * compound epoch+version, used by storage layer to serialize mutations
   *
   * Packed: a 32-bit epoch immediately followed by a 64-bit version
   * (12 bytes, no padding).
   */
  struct ceph_eversion {
      __le32 epoch;
      __le64 version;
  } __attribute__ ((packed));
  /*
   * osd map bits
   */

  /* status bits */
  #define CEPH_OSD_EXISTS  (1<<0)
  #define CEPH_OSD_UP      (1<<1)
  #define CEPH_OSD_AUTOOUT (1<<2)  /* osd was automatically marked out */
  #define CEPH_OSD_NEW     (1<<3)  /* osd is new, never marked in */

  /* implemented outside this header; takes a state value s */
  extern const char *ceph_osd_state_name(int s);

  /* osd weights. fixed point value: 0x10000 == 1.0 ("in"), 0 == "out" */
  #define CEPH_OSD_IN  0x10000
  #define CEPH_OSD_OUT 0
  /*
   * osd map flag bits
   */
  #define CEPH_OSDMAP_NEARFULL   (1<<0)  /* sync writes (near ENOSPC) */
  #define CEPH_OSDMAP_FULL       (1<<1)  /* no data writes (ENOSPC) */
  #define CEPH_OSDMAP_PAUSERD    (1<<2)  /* pause all reads */
  #define CEPH_OSDMAP_PAUSEWR    (1<<3)  /* pause all writes */
  #define CEPH_OSDMAP_PAUSEREC   (1<<4)  /* pause recovery */
  #define CEPH_OSDMAP_NOUP       (1<<5)  /* block osd boot */
  #define CEPH_OSDMAP_NODOWN     (1<<6)  /* block osd mark-down/failure */
  #define CEPH_OSDMAP_NOOUT      (1<<7)  /* block osd auto mark-out */
  #define CEPH_OSDMAP_NOIN       (1<<8)  /* block osd auto mark-in */
  #define CEPH_OSDMAP_NOBACKFILL (1<<9)  /* block osd backfill */
  #define CEPH_OSDMAP_NORECOVER  (1<<10) /* block osd recovery and backfill */
  /*
   * The error code to return when an OSD can't handle a write
   * because it is too large.
   */
  #define OSD_WRITETOOBIG EMSGSIZE
  /*
   * osd ops
   *
   * WARNING: do not use these op codes directly. Use the helpers
   * defined below instead. In certain cases, op code behavior was
   * redefined, resulting in special-cases in the helpers.
   *
   * Each op code is composed as (mode | type | number): the mode lives in
   * the bits selected by CEPH_OSD_OP_MODE, the type in the bits selected by
   * CEPH_OSD_OP_TYPE, and the low byte numbers the op within that group.
   */
  #define CEPH_OSD_OP_MODE       0xf000
  #define CEPH_OSD_OP_MODE_RD    0x1000
  #define CEPH_OSD_OP_MODE_WR    0x2000
  #define CEPH_OSD_OP_MODE_RMW   0x3000
  #define CEPH_OSD_OP_MODE_SUB   0x4000

  #define CEPH_OSD_OP_TYPE       0x0f00
  #define CEPH_OSD_OP_TYPE_LOCK  0x0100
  #define CEPH_OSD_OP_TYPE_DATA  0x0200
  #define CEPH_OSD_OP_TYPE_ATTR  0x0300
  #define CEPH_OSD_OP_TYPE_EXEC  0x0400
  #define CEPH_OSD_OP_TYPE_PG    0x0500
  #define CEPH_OSD_OP_TYPE_MULTI 0x0600  /* multiobject */

  enum {
      /** data **/
      /* read */
      CEPH_OSD_OP_READ        = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 1,
      CEPH_OSD_OP_STAT        = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 2,
      CEPH_OSD_OP_MAPEXT      = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 3,

      /* fancy read */
      CEPH_OSD_OP_MASKTRUNC   = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 4,
      CEPH_OSD_OP_SPARSE_READ = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 5,

      CEPH_OSD_OP_NOTIFY      = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 6,
      CEPH_OSD_OP_NOTIFY_ACK  = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 7,

      /* versioning */
      CEPH_OSD_OP_ASSERT_VER  = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 8,

      /* write */
      CEPH_OSD_OP_WRITE       = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 1,
      CEPH_OSD_OP_WRITEFULL   = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 2,
      CEPH_OSD_OP_TRUNCATE    = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 3,
      CEPH_OSD_OP_ZERO        = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 4,
      CEPH_OSD_OP_DELETE      = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 5,

      /* fancy write */
      CEPH_OSD_OP_APPEND      = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 6,
      CEPH_OSD_OP_STARTSYNC   = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 7,
      CEPH_OSD_OP_SETTRUNC    = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 8,
      CEPH_OSD_OP_TRIMTRUNC   = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 9,

      CEPH_OSD_OP_TMAPUP      = CEPH_OSD_OP_MODE_RMW | CEPH_OSD_OP_TYPE_DATA | 10,
      CEPH_OSD_OP_TMAPPUT     = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 11,
      CEPH_OSD_OP_TMAPGET     = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 12,

      CEPH_OSD_OP_CREATE      = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 13,
      CEPH_OSD_OP_ROLLBACK    = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 14,

      CEPH_OSD_OP_WATCH       = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 15,

      /* omap */
      CEPH_OSD_OP_OMAPGETKEYS   = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 17,
      CEPH_OSD_OP_OMAPGETVALS   = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 18,
      CEPH_OSD_OP_OMAPGETHEADER = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 19,
      CEPH_OSD_OP_OMAPGETVALSBYKEYS =
          CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 20,
      CEPH_OSD_OP_OMAPSETVALS   = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 21,
      CEPH_OSD_OP_OMAPSETHEADER = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 22,
      CEPH_OSD_OP_OMAPCLEAR     = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 23,
      CEPH_OSD_OP_OMAPRMKEYS    = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 24,
      CEPH_OSD_OP_OMAP_CMP      = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 25,

      /** multi **/
      CEPH_OSD_OP_CLONERANGE = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_MULTI | 1,
      CEPH_OSD_OP_ASSERT_SRC_VERSION = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_MULTI | 2,
      CEPH_OSD_OP_SRC_CMPXATTR = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_MULTI | 3,

      /** attrs **/
      /* read */
      CEPH_OSD_OP_GETXATTR    = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_ATTR | 1,
      CEPH_OSD_OP_GETXATTRS   = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_ATTR | 2,
      CEPH_OSD_OP_CMPXATTR    = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_ATTR | 3,

      /* write */
      CEPH_OSD_OP_SETXATTR    = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_ATTR | 1,
      CEPH_OSD_OP_SETXATTRS   = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_ATTR | 2,
      CEPH_OSD_OP_RESETXATTRS = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_ATTR | 3,
      CEPH_OSD_OP_RMXATTR     = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_ATTR | 4,

      /** subop **/
      CEPH_OSD_OP_PULL            = CEPH_OSD_OP_MODE_SUB | 1,
      CEPH_OSD_OP_PUSH            = CEPH_OSD_OP_MODE_SUB | 2,
      CEPH_OSD_OP_BALANCEREADS    = CEPH_OSD_OP_MODE_SUB | 3,
      CEPH_OSD_OP_UNBALANCEREADS  = CEPH_OSD_OP_MODE_SUB | 4,
      CEPH_OSD_OP_SCRUB           = CEPH_OSD_OP_MODE_SUB | 5,
      CEPH_OSD_OP_SCRUB_RESERVE   = CEPH_OSD_OP_MODE_SUB | 6,
      CEPH_OSD_OP_SCRUB_UNRESERVE = CEPH_OSD_OP_MODE_SUB | 7,
      CEPH_OSD_OP_SCRUB_STOP      = CEPH_OSD_OP_MODE_SUB | 8,
      CEPH_OSD_OP_SCRUB_MAP       = CEPH_OSD_OP_MODE_SUB | 9,

      /** lock **/
      CEPH_OSD_OP_WRLOCK    = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_LOCK | 1,
      CEPH_OSD_OP_WRUNLOCK  = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_LOCK | 2,
      CEPH_OSD_OP_RDLOCK    = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_LOCK | 3,
      CEPH_OSD_OP_RDUNLOCK  = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_LOCK | 4,
      CEPH_OSD_OP_UPLOCK    = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_LOCK | 5,
      CEPH_OSD_OP_DNLOCK    = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_LOCK | 6,

      /** exec **/
      /* note: the RD bit here is wrong; see special-case below in helper */
      CEPH_OSD_OP_CALL    = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_EXEC | 1,

      /** pg **/
      CEPH_OSD_OP_PGLS        = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_PG | 1,
      CEPH_OSD_OP_PGLS_FILTER = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_PG | 2,
  };
  254. static inline int ceph_osd_op_type_lock(int op)
  255. {
  256. return (op & CEPH_OSD_OP_TYPE) == CEPH_OSD_OP_TYPE_LOCK;
  257. }
  258. static inline int ceph_osd_op_type_data(int op)
  259. {
  260. return (op & CEPH_OSD_OP_TYPE) == CEPH_OSD_OP_TYPE_DATA;
  261. }
  262. static inline int ceph_osd_op_type_attr(int op)
  263. {
  264. return (op & CEPH_OSD_OP_TYPE) == CEPH_OSD_OP_TYPE_ATTR;
  265. }
  266. static inline int ceph_osd_op_type_exec(int op)
  267. {
  268. return (op & CEPH_OSD_OP_TYPE) == CEPH_OSD_OP_TYPE_EXEC;
  269. }
  270. static inline int ceph_osd_op_type_pg(int op)
  271. {
  272. return (op & CEPH_OSD_OP_TYPE) == CEPH_OSD_OP_TYPE_PG;
  273. }
  274. static inline int ceph_osd_op_type_multi(int op)
  275. {
  276. return (op & CEPH_OSD_OP_TYPE) == CEPH_OSD_OP_TYPE_MULTI;
  277. }
  278. static inline int ceph_osd_op_mode_subop(int op)
  279. {
  280. return (op & CEPH_OSD_OP_MODE) == CEPH_OSD_OP_MODE_SUB;
  281. }
  282. static inline int ceph_osd_op_mode_read(int op)
  283. {
  284. return (op & CEPH_OSD_OP_MODE_RD) &&
  285. op != CEPH_OSD_OP_CALL;
  286. }
  287. static inline int ceph_osd_op_mode_modify(int op)
  288. {
  289. return op & CEPH_OSD_OP_MODE_WR;
  290. }
  /*
   * note that the following tmap stuff is also defined in the ceph librados.h
   * any modification here needs to be updated there
   */
  #define CEPH_OSD_TMAP_HDR      'h'
  #define CEPH_OSD_TMAP_SET      's'
  #define CEPH_OSD_TMAP_CREATE   'c'  /* create key */
  #define CEPH_OSD_TMAP_RM       'r'
  #define CEPH_OSD_TMAP_RMSLOPPY 'R'

  /* implemented outside this header; takes an op code */
  extern const char *ceph_osd_op_name(int op);
  /*
   * osd op flags
   *
   * An op may be READ, WRITE, or READ|WRITE.
   *
   * Every flag is a distinct single bit, so flags can be OR-ed together.
   */
  enum {
      CEPH_OSD_FLAG_ACK            = 0x0001,  /* want (or is) "ack" ack */
      CEPH_OSD_FLAG_ONNVRAM        = 0x0002,  /* want (or is) "onnvram" ack */
      CEPH_OSD_FLAG_ONDISK         = 0x0004,  /* want (or is) "ondisk" ack */
      CEPH_OSD_FLAG_RETRY          = 0x0008,  /* resend attempt */
      CEPH_OSD_FLAG_READ           = 0x0010,  /* op may read */
      CEPH_OSD_FLAG_WRITE          = 0x0020,  /* op may write */
      CEPH_OSD_FLAG_ORDERSNAP      = 0x0040,  /* EOLDSNAP if snapc is out of order */
      CEPH_OSD_FLAG_PEERSTAT_OLD   = 0x0080,  /* DEPRECATED msg includes osd_peer_stat */
      CEPH_OSD_FLAG_BALANCE_READS  = 0x0100,
      CEPH_OSD_FLAG_PARALLELEXEC   = 0x0200,  /* execute op in parallel */
      CEPH_OSD_FLAG_PGOP           = 0x0400,  /* pg op, no object */
      CEPH_OSD_FLAG_EXEC           = 0x0800,  /* op may exec */
      CEPH_OSD_FLAG_EXEC_PUBLIC    = 0x1000,  /* DEPRECATED op may exec (public) */
      CEPH_OSD_FLAG_LOCALIZE_READS = 0x2000,  /* read from nearby replica, if any */
      CEPH_OSD_FLAG_RWORDERED      = 0x4000,  /* order wrt concurrent reads */
  };
  /* per-op flag bits */
  enum {
      CEPH_OSD_OP_FLAG_EXCL   = 1,  /* EXCL object create */
      CEPH_OSD_OP_FLAG_FAILOK = 2,  /* continue despite failure */
  };
  /* ceph-specific error names, aliased onto existing errno values */
  #define EOLDSNAPC    ERESTART  /* ORDERSNAP flag set; writer has old snapc */
  #define EBLACKLISTED ESHUTDOWN /* blacklisted */
  /* xattr comparison: operators (carried in the xattr op's cmp_op field) */
  enum {
      CEPH_OSD_CMPXATTR_OP_NOP = 0,
      CEPH_OSD_CMPXATTR_OP_EQ  = 1,
      CEPH_OSD_CMPXATTR_OP_NE  = 2,
      CEPH_OSD_CMPXATTR_OP_GT  = 3,
      CEPH_OSD_CMPXATTR_OP_GTE = 4,
      CEPH_OSD_CMPXATTR_OP_LT  = 5,
      CEPH_OSD_CMPXATTR_OP_LTE = 6
  };
  /* xattr comparison: operand modes (carried in the xattr op's cmp_mode field) */
  enum {
      CEPH_OSD_CMPXATTR_MODE_STRING = 1,
      CEPH_OSD_CMPXATTR_MODE_U64    = 2
  };
  #define RADOS_NOTIFY_VER 1
  /*
   * an individual object operation. each may be accompanied by some data
   * payload
   *
   * The anonymous union holds the per-op arguments; which member applies
   * depends on the op code in @op.  The structure and every union member
   * are packed, so field order and widths must not change.
   */
  struct ceph_osd_op {
      __le16 op;     /* CEPH_OSD_OP_* */
      __le32 flags;  /* CEPH_OSD_FLAG_* */
      union {
          struct {
              __le64 offset;
              __le64 length;
              __le64 truncate_size;
              __le32 truncate_seq;
          } __attribute__ ((packed)) extent;
          struct {
              __le32 name_len;
              __le32 value_len;
              __u8 cmp_op;    /* CEPH_OSD_CMPXATTR_OP_* */
              __u8 cmp_mode;  /* CEPH_OSD_CMPXATTR_MODE_* */
          } __attribute__ ((packed)) xattr;
          struct {
              __u8 class_len;
              __u8 method_len;
              __u8 argc;
              __le32 indata_len;
          } __attribute__ ((packed)) cls;
          struct {
              __le64 cookie;
              __le64 count;
          } __attribute__ ((packed)) pgls;
          struct {
              __le64 snapid;
          } __attribute__ ((packed)) snap;
          struct {
              __le64 cookie;
              __le64 ver;
              __u8 flag;  /* 0 = unwatch, 1 = watch */
          } __attribute__ ((packed)) watch;
          struct {
              __le64 offset;
              __le64 length;
              __le64 src_offset;
          } __attribute__ ((packed)) clonerange;
      };
      __le32 payload_len;
  } __attribute__ ((packed));
  387. /*
  388. * osd request message header. each request may include multiple
  389. * ceph_osd_op object operations.
  390. */
  391. struct ceph_osd_request_head {
  392. __le32 client_inc; /* client incarnation */
  393. struct ceph_object_layout layout; /* pgid */
  394. __le32 osdmap_epoch; /* client's osdmap epoch */
  395. __le32 flags;
  396. struct ceph_timespec mtime; /* for mutations only */
  397. struct ceph_eversion reassert_version; /* if we are replaying op */
  398. __le32 object_len; /* length of object name */
  399. __le64 snapid; /* snapid to read */
  400. __le64 snap_seq; /* writer's snap context */
  401. __le32 num_snaps;
  402. __le16 num_ops;
  403. struct ceph_osd_op ops[]; /* followed by ops[], obj, ticket, snaps */
  404. } __attribute__ ((packed));
  405. struct ceph_osd_reply_head {
  406. __le32 client_inc; /* client incarnation */
  407. __le32 flags;
  408. struct ceph_object_layout layout;
  409. __le32 osdmap_epoch;
  410. struct ceph_eversion reassert_version; /* for replaying uncommitted */
  411. __le32 result; /* result code */
  412. __le32 object_len; /* length of object name */
  413. __le32 num_ops;
  414. struct ceph_osd_op ops[0]; /* ops[], object */
  415. } __attribute__ ((packed));
  416. #endif