13d14c5d2SYehuda Sadeh #ifndef _FS_CEPH_OSD_CLIENT_H 23d14c5d2SYehuda Sadeh #define _FS_CEPH_OSD_CLIENT_H 33d14c5d2SYehuda Sadeh 43d14c5d2SYehuda Sadeh #include <linux/completion.h> 53d14c5d2SYehuda Sadeh #include <linux/kref.h> 63d14c5d2SYehuda Sadeh #include <linux/mempool.h> 73d14c5d2SYehuda Sadeh #include <linux/rbtree.h> 83d14c5d2SYehuda Sadeh 96c4a1915SAlex Elder #include <linux/ceph/types.h> 106c4a1915SAlex Elder #include <linux/ceph/osdmap.h> 116c4a1915SAlex Elder #include <linux/ceph/messenger.h> 126c4a1915SAlex Elder #include <linux/ceph/auth.h> 13c885837fSAlex Elder #include <linux/ceph/pagelist.h> 143d14c5d2SYehuda Sadeh 15224736d9SStratos Psomadakis /* 16224736d9SStratos Psomadakis * Maximum object name size 17224736d9SStratos Psomadakis * (must be at least as big as RBD_MAX_MD_NAME_LEN -- currently 100) 18224736d9SStratos Psomadakis */ 19224736d9SStratos Psomadakis #define MAX_OBJ_NAME_SIZE 100 20224736d9SStratos Psomadakis 213d14c5d2SYehuda Sadeh struct ceph_msg; 223d14c5d2SYehuda Sadeh struct ceph_snap_context; 233d14c5d2SYehuda Sadeh struct ceph_osd_request; 243d14c5d2SYehuda Sadeh struct ceph_osd_client; 253d14c5d2SYehuda Sadeh struct ceph_authorizer; 263d14c5d2SYehuda Sadeh 273d14c5d2SYehuda Sadeh /* 283d14c5d2SYehuda Sadeh * completion callback for async writepages 293d14c5d2SYehuda Sadeh */ 303d14c5d2SYehuda Sadeh typedef void (*ceph_osdc_callback_t)(struct ceph_osd_request *, 313d14c5d2SYehuda Sadeh struct ceph_msg *); 323d14c5d2SYehuda Sadeh 333d14c5d2SYehuda Sadeh /* a given osd we're communicating with */ 343d14c5d2SYehuda Sadeh struct ceph_osd { 353d14c5d2SYehuda Sadeh atomic_t o_ref; 363d14c5d2SYehuda Sadeh struct ceph_osd_client *o_osdc; 373d14c5d2SYehuda Sadeh int o_osd; 383d14c5d2SYehuda Sadeh int o_incarnation; 393d14c5d2SYehuda Sadeh struct rb_node o_node; 403d14c5d2SYehuda Sadeh struct ceph_connection o_con; 413d14c5d2SYehuda Sadeh struct list_head o_requests; 42a40c4f10SYehuda Sadeh struct list_head o_linger_requests; 433d14c5d2SYehuda Sadeh struct list_head o_osd_lru; 446c4a1915SAlex Elder struct ceph_auth_handshake o_auth; 453d14c5d2SYehuda Sadeh unsigned long lru_ttl; 463d14c5d2SYehuda Sadeh int o_marked_for_keepalive; 473d14c5d2SYehuda Sadeh struct list_head o_keepalive_item; 483d14c5d2SYehuda Sadeh }; 493d14c5d2SYehuda Sadeh 501b83bef2SSage Weil 511b83bef2SSage Weil #define CEPH_OSD_MAX_OP 10 521b83bef2SSage Weil 533d14c5d2SYehuda Sadeh /* an in-flight request */ 543d14c5d2SYehuda Sadeh struct ceph_osd_request { 553d14c5d2SYehuda Sadeh u64 r_tid; /* unique for this client */ 563d14c5d2SYehuda Sadeh struct rb_node r_node; 573d14c5d2SYehuda Sadeh struct list_head r_req_lru_item; 583d14c5d2SYehuda Sadeh struct list_head r_osd_item; 59a40c4f10SYehuda Sadeh struct list_head r_linger_item; 60a40c4f10SYehuda Sadeh struct list_head r_linger_osd; 613d14c5d2SYehuda Sadeh struct ceph_osd *r_osd; 625b191d99SSage Weil struct ceph_pg r_pgid; 633d14c5d2SYehuda Sadeh int r_pg_osds[CEPH_PG_MAX_SIZE]; 643d14c5d2SYehuda Sadeh int r_num_pg_osds; 653d14c5d2SYehuda Sadeh 663d14c5d2SYehuda Sadeh struct ceph_connection *r_con_filling_msg; 673d14c5d2SYehuda Sadeh 683d14c5d2SYehuda Sadeh struct ceph_msg *r_request, *r_reply; 693d14c5d2SYehuda Sadeh int r_flags; /* any additional flags for the osd */ 703d14c5d2SYehuda Sadeh u32 r_sent; /* >0 if r_request is sending/sent */ 711b83bef2SSage Weil int r_num_ops; 721b83bef2SSage Weil 731b83bef2SSage Weil /* encoded message content */ 741b83bef2SSage Weil struct ceph_osd_op *r_request_ops; 751b83bef2SSage Weil /* these are updated on each send */ 761b83bef2SSage Weil __le32 *r_request_osdmap_epoch; 771b83bef2SSage Weil __le32 *r_request_flags; 781b83bef2SSage Weil __le64 *r_request_pool; 791b83bef2SSage Weil void *r_request_pgid; 801b83bef2SSage Weil __le32 *r_request_attempts; 811b83bef2SSage Weil struct ceph_eversion *r_request_reassert_version; 821b83bef2SSage Weil 831b83bef2SSage Weil int r_result; 841b83bef2SSage Weil int r_reply_op_len[CEPH_OSD_MAX_OP]; 851b83bef2SSage Weil s32 r_reply_op_result[CEPH_OSD_MAX_OP]; 863d14c5d2SYehuda Sadeh int r_got_reply; 87a40c4f10SYehuda Sadeh int r_linger; 880d5af164SAlex Elder int r_completed; 893d14c5d2SYehuda Sadeh 903d14c5d2SYehuda Sadeh struct ceph_osd_client *r_osdc; 913d14c5d2SYehuda Sadeh struct kref r_kref; 923d14c5d2SYehuda Sadeh bool r_mempool; 933d14c5d2SYehuda Sadeh struct completion r_completion, r_safe_completion; 943d14c5d2SYehuda Sadeh ceph_osdc_callback_t r_callback, r_safe_callback; 953d14c5d2SYehuda Sadeh struct ceph_eversion r_reassert_version; 963d14c5d2SYehuda Sadeh struct list_head r_unsafe_item; 973d14c5d2SYehuda Sadeh 983d14c5d2SYehuda Sadeh struct inode *r_inode; /* for use by callbacks */ 993d14c5d2SYehuda Sadeh void *r_priv; /* ditto */ 1003d14c5d2SYehuda Sadeh 101224736d9SStratos Psomadakis char r_oid[MAX_OBJ_NAME_SIZE]; /* object name */ 1023d14c5d2SYehuda Sadeh int r_oid_len; 1032169aea6SSage Weil u64 r_snapid; 1043d14c5d2SYehuda Sadeh unsigned long r_stamp; /* send OR check time */ 1053d14c5d2SYehuda Sadeh 1063d14c5d2SYehuda Sadeh struct ceph_file_layout r_file_layout; 1073d14c5d2SYehuda Sadeh struct ceph_snap_context *r_snapc; /* snap context for writes */ 1083d14c5d2SYehuda Sadeh unsigned r_num_pages; /* size of page array (follows) */ 109b7495fc2SSage Weil unsigned r_page_alignment; /* io offset in first page */ 1103d14c5d2SYehuda Sadeh struct page **r_pages; /* pages for data payload */ 1113d14c5d2SYehuda Sadeh int r_pages_from_pool; 1123d14c5d2SYehuda Sadeh int r_own_pages; /* if true, i own page list */ 1133d14c5d2SYehuda Sadeh #ifdef CONFIG_BLOCK 1143d14c5d2SYehuda Sadeh struct bio *r_bio; /* instead of pages */ 1153d14c5d2SYehuda Sadeh #endif 1163d14c5d2SYehuda Sadeh 117c885837fSAlex Elder struct ceph_pagelist r_trail; /* trailing part of the data */ 1183d14c5d2SYehuda Sadeh }; 1193d14c5d2SYehuda Sadeh 120a40c4f10SYehuda Sadeh struct ceph_osd_event { 121a40c4f10SYehuda Sadeh u64 cookie; 122a40c4f10SYehuda Sadeh int one_shot; 123a40c4f10SYehuda Sadeh struct ceph_osd_client *osdc; 124a40c4f10SYehuda Sadeh void (*cb)(u64, u64, u8, void *); 125a40c4f10SYehuda Sadeh void *data; 126a40c4f10SYehuda Sadeh struct rb_node node; 127a40c4f10SYehuda Sadeh struct list_head osd_node; 128a40c4f10SYehuda Sadeh struct kref kref; 129a40c4f10SYehuda Sadeh }; 130a40c4f10SYehuda Sadeh 131a40c4f10SYehuda Sadeh struct ceph_osd_event_work { 132a40c4f10SYehuda Sadeh struct work_struct work; 133a40c4f10SYehuda Sadeh struct ceph_osd_event *event; 134a40c4f10SYehuda Sadeh u64 ver; 135a40c4f10SYehuda Sadeh u64 notify_id; 136a40c4f10SYehuda Sadeh u8 opcode; 137a40c4f10SYehuda Sadeh }; 138a40c4f10SYehuda Sadeh 1393d14c5d2SYehuda Sadeh struct ceph_osd_client { 1403d14c5d2SYehuda Sadeh struct ceph_client *client; 1413d14c5d2SYehuda Sadeh 1423d14c5d2SYehuda Sadeh struct ceph_osdmap *osdmap; /* current map */ 1433d14c5d2SYehuda Sadeh struct rw_semaphore map_sem; 1443d14c5d2SYehuda Sadeh struct completion map_waiters; 1453d14c5d2SYehuda Sadeh u64 last_requested_map; 1463d14c5d2SYehuda Sadeh 1473d14c5d2SYehuda Sadeh struct mutex request_mutex; 1483d14c5d2SYehuda Sadeh struct rb_root osds; /* osds */ 1493d14c5d2SYehuda Sadeh struct list_head osd_lru; /* idle osds */ 1503d14c5d2SYehuda Sadeh u64 timeout_tid; /* tid of timeout triggering rq */ 1513d14c5d2SYehuda Sadeh u64 last_tid; /* tid of last request */ 1523d14c5d2SYehuda Sadeh struct rb_root requests; /* pending requests */ 1536f6c7006SSage Weil struct list_head req_lru; /* in-flight lru */ 1546f6c7006SSage Weil struct list_head req_unsent; /* unsent/need-resend queue */ 1556f6c7006SSage Weil struct list_head req_notarget; /* map to no osd */ 156a40c4f10SYehuda Sadeh struct list_head req_linger; /* lingering requests */ 1573d14c5d2SYehuda Sadeh int num_requests; 1583d14c5d2SYehuda Sadeh struct delayed_work timeout_work; 1593d14c5d2SYehuda Sadeh struct delayed_work osds_timeout_work; 1603d14c5d2SYehuda Sadeh #ifdef CONFIG_DEBUG_FS 1613d14c5d2SYehuda Sadeh struct dentry *debugfs_file; 1623d14c5d2SYehuda Sadeh #endif 1633d14c5d2SYehuda Sadeh 1643d14c5d2SYehuda Sadeh mempool_t *req_mempool; 1653d14c5d2SYehuda Sadeh 1663d14c5d2SYehuda Sadeh struct ceph_msgpool msgpool_op; 1673d14c5d2SYehuda Sadeh struct ceph_msgpool msgpool_op_reply; 168a40c4f10SYehuda Sadeh 169a40c4f10SYehuda Sadeh spinlock_t event_lock; 170a40c4f10SYehuda Sadeh struct rb_root event_tree; 171a40c4f10SYehuda Sadeh u64 event_count; 172a40c4f10SYehuda Sadeh 173a40c4f10SYehuda Sadeh struct workqueue_struct *notify_wq; 1743d14c5d2SYehuda Sadeh }; 1753d14c5d2SYehuda Sadeh 1763d14c5d2SYehuda Sadeh struct ceph_osd_req_op { 1773d14c5d2SYehuda Sadeh u16 op; /* CEPH_OSD_OP_* */ 178e7e319a9SAlex Elder u32 payload_len; 1793d14c5d2SYehuda Sadeh union { 1803d14c5d2SYehuda Sadeh struct { 1813d14c5d2SYehuda Sadeh u64 offset, length; 1823d14c5d2SYehuda Sadeh u64 truncate_size; 1833d14c5d2SYehuda Sadeh u32 truncate_seq; 1843d14c5d2SYehuda Sadeh } extent; 1853d14c5d2SYehuda Sadeh struct { 1863d14c5d2SYehuda Sadeh const char *name; 1872a24d1f4SAlex Elder const void *val; 188e7e319a9SAlex Elder u32 name_len; 1893d14c5d2SYehuda Sadeh u32 value_len; 1903d14c5d2SYehuda Sadeh __u8 cmp_op; /* CEPH_OSD_CMPXATTR_OP_* */ 1913d14c5d2SYehuda Sadeh __u8 cmp_mode; /* CEPH_OSD_CMPXATTR_MODE_* */ 1923d14c5d2SYehuda Sadeh } xattr; 1933d14c5d2SYehuda Sadeh struct { 1943d14c5d2SYehuda Sadeh const char *class_name; 1953d14c5d2SYehuda Sadeh const char *method_name; 1962a24d1f4SAlex Elder const void *indata; 1973d14c5d2SYehuda Sadeh u32 indata_len; 198e7e319a9SAlex Elder __u8 class_len; 199e7e319a9SAlex Elder __u8 method_len; 200e7e319a9SAlex Elder __u8 argc; 2013d14c5d2SYehuda Sadeh } cls; 2023d14c5d2SYehuda Sadeh struct { 203e7e319a9SAlex Elder u64 cookie; 204e7e319a9SAlex Elder u64 count; 2053d14c5d2SYehuda Sadeh } pgls; 2063d14c5d2SYehuda Sadeh struct { 2073d14c5d2SYehuda Sadeh u64 snapid; 2083d14c5d2SYehuda Sadeh } snap; 209a40c4f10SYehuda Sadeh struct { 210a40c4f10SYehuda Sadeh u64 cookie; 211a40c4f10SYehuda Sadeh u64 ver; 212a40c4f10SYehuda Sadeh u32 prot_ver; 213a40c4f10SYehuda Sadeh u32 timeout; 214e7e319a9SAlex Elder __u8 flag; 215a40c4f10SYehuda Sadeh } watch; 2163d14c5d2SYehuda Sadeh }; 2173d14c5d2SYehuda Sadeh }; 2183d14c5d2SYehuda Sadeh 2193d14c5d2SYehuda Sadeh extern int ceph_osdc_init(struct ceph_osd_client *osdc, 2203d14c5d2SYehuda Sadeh struct ceph_client *client); 2213d14c5d2SYehuda Sadeh extern void ceph_osdc_stop(struct ceph_osd_client *osdc); 2223d14c5d2SYehuda Sadeh 2233d14c5d2SYehuda Sadeh extern void ceph_osdc_handle_reply(struct ceph_osd_client *osdc, 2243d14c5d2SYehuda Sadeh struct ceph_msg *msg); 2253d14c5d2SYehuda Sadeh extern void ceph_osdc_handle_map(struct ceph_osd_client *osdc, 2263d14c5d2SYehuda Sadeh struct ceph_msg *msg); 2273d14c5d2SYehuda Sadeh 2283d14c5d2SYehuda Sadeh extern struct ceph_osd_request *ceph_osdc_alloc_request(struct ceph_osd_client *osdc, 2293d14c5d2SYehuda Sadeh struct ceph_snap_context *snapc, 230ae7ca4a3SAlex Elder unsigned int num_op, 2313d14c5d2SYehuda Sadeh bool use_mempool, 23254a54007SAlex Elder gfp_t gfp_flags); 2333d14c5d2SYehuda Sadeh 2343d14c5d2SYehuda Sadeh extern void ceph_osdc_build_request(struct ceph_osd_request *req, 2350120be3cSAlex Elder u64 off, u64 len, 236ae7ca4a3SAlex Elder unsigned int num_op, 2373d14c5d2SYehuda Sadeh struct ceph_osd_req_op *src_ops, 2383d14c5d2SYehuda Sadeh struct ceph_snap_context *snapc, 2394d6b250bSAlex Elder u64 snap_id, 240af77f26cSAlex Elder struct timespec *mtime); 2413d14c5d2SYehuda Sadeh 2423d14c5d2SYehuda Sadeh extern struct ceph_osd_request *ceph_osdc_new_request(struct ceph_osd_client *, 2433d14c5d2SYehuda Sadeh struct ceph_file_layout *layout, 2443d14c5d2SYehuda Sadeh struct ceph_vino vino, 2453d14c5d2SYehuda Sadeh u64 offset, u64 *len, int op, int flags, 2463d14c5d2SYehuda Sadeh struct ceph_snap_context *snapc, 2473d14c5d2SYehuda Sadeh int do_sync, u32 truncate_seq, 2483d14c5d2SYehuda Sadeh u64 truncate_size, 2493d14c5d2SYehuda Sadeh struct timespec *mtime, 250153e5167SAlex Elder bool use_mempool); 2513d14c5d2SYehuda Sadeh 252a40c4f10SYehuda Sadeh extern void ceph_osdc_set_request_linger(struct ceph_osd_client *osdc, 253a40c4f10SYehuda Sadeh struct ceph_osd_request *req); 254a40c4f10SYehuda Sadeh extern void ceph_osdc_unregister_linger_request(struct ceph_osd_client *osdc, 255a40c4f10SYehuda Sadeh struct ceph_osd_request *req); 256a40c4f10SYehuda Sadeh 2573d14c5d2SYehuda Sadeh static inline void ceph_osdc_get_request(struct ceph_osd_request *req) 2583d14c5d2SYehuda Sadeh { 2593d14c5d2SYehuda Sadeh kref_get(&req->r_kref); 2603d14c5d2SYehuda Sadeh } 2613d14c5d2SYehuda Sadeh extern void ceph_osdc_release_request(struct kref *kref); 2623d14c5d2SYehuda Sadeh static inline void ceph_osdc_put_request(struct ceph_osd_request *req) 2633d14c5d2SYehuda Sadeh { 2643d14c5d2SYehuda Sadeh kref_put(&req->r_kref, ceph_osdc_release_request); 2653d14c5d2SYehuda Sadeh } 2663d14c5d2SYehuda Sadeh 2673d14c5d2SYehuda Sadeh extern int ceph_osdc_start_request(struct ceph_osd_client *osdc, 2683d14c5d2SYehuda Sadeh struct ceph_osd_request *req, 2693d14c5d2SYehuda Sadeh bool nofail); 2703d14c5d2SYehuda Sadeh extern int ceph_osdc_wait_request(struct ceph_osd_client *osdc, 2713d14c5d2SYehuda Sadeh struct ceph_osd_request *req); 2723d14c5d2SYehuda Sadeh extern void ceph_osdc_sync(struct ceph_osd_client *osdc); 2733d14c5d2SYehuda Sadeh 2743d14c5d2SYehuda Sadeh extern int ceph_osdc_readpages(struct ceph_osd_client *osdc, 2753d14c5d2SYehuda Sadeh struct ceph_vino vino, 2763d14c5d2SYehuda Sadeh struct ceph_file_layout *layout, 2773d14c5d2SYehuda Sadeh u64 off, u64 *plen, 2783d14c5d2SYehuda Sadeh u32 truncate_seq, u64 truncate_size, 279b7495fc2SSage Weil struct page **pages, int nr_pages, 280b7495fc2SSage Weil int page_align); 2813d14c5d2SYehuda Sadeh 2823d14c5d2SYehuda Sadeh extern int ceph_osdc_writepages(struct ceph_osd_client *osdc, 2833d14c5d2SYehuda Sadeh struct ceph_vino vino, 2843d14c5d2SYehuda Sadeh struct ceph_file_layout *layout, 2853d14c5d2SYehuda Sadeh struct ceph_snap_context *sc, 2863d14c5d2SYehuda Sadeh u64 off, u64 len, 2873d14c5d2SYehuda Sadeh u32 truncate_seq, u64 truncate_size, 2883d14c5d2SYehuda Sadeh struct timespec *mtime, 28924808826SAlex Elder struct page **pages, int nr_pages); 2903d14c5d2SYehuda Sadeh 291a40c4f10SYehuda Sadeh /* watch/notify events */ 292a40c4f10SYehuda Sadeh extern int ceph_osdc_create_event(struct ceph_osd_client *osdc, 293a40c4f10SYehuda Sadeh void (*event_cb)(u64, u64, u8, void *), 2943c663bbdSAlex Elder void *data, struct ceph_osd_event **pevent); 295a40c4f10SYehuda Sadeh extern void ceph_osdc_cancel_event(struct ceph_osd_event *event); 296a40c4f10SYehuda Sadeh extern void ceph_osdc_put_event(struct ceph_osd_event *event); 2973d14c5d2SYehuda Sadeh #endif 2983d14c5d2SYehuda Sadeh 299