13d14c5d2SYehuda Sadeh #ifndef _FS_CEPH_OSD_CLIENT_H 23d14c5d2SYehuda Sadeh #define _FS_CEPH_OSD_CLIENT_H 33d14c5d2SYehuda Sadeh 43d14c5d2SYehuda Sadeh #include <linux/completion.h> 53d14c5d2SYehuda Sadeh #include <linux/kref.h> 63d14c5d2SYehuda Sadeh #include <linux/mempool.h> 73d14c5d2SYehuda Sadeh #include <linux/rbtree.h> 83d14c5d2SYehuda Sadeh 96c4a1915SAlex Elder #include <linux/ceph/types.h> 106c4a1915SAlex Elder #include <linux/ceph/osdmap.h> 116c4a1915SAlex Elder #include <linux/ceph/messenger.h> 126c4a1915SAlex Elder #include <linux/ceph/auth.h> 13c885837fSAlex Elder #include <linux/ceph/pagelist.h> 143d14c5d2SYehuda Sadeh 15224736d9SStratos Psomadakis /* 16224736d9SStratos Psomadakis * Maximum object name size 17224736d9SStratos Psomadakis * (must be at least as big as RBD_MAX_MD_NAME_LEN -- currently 100) 18224736d9SStratos Psomadakis */ 19224736d9SStratos Psomadakis #define MAX_OBJ_NAME_SIZE 100 20224736d9SStratos Psomadakis 213d14c5d2SYehuda Sadeh struct ceph_msg; 223d14c5d2SYehuda Sadeh struct ceph_snap_context; 233d14c5d2SYehuda Sadeh struct ceph_osd_request; 243d14c5d2SYehuda Sadeh struct ceph_osd_client; 253d14c5d2SYehuda Sadeh struct ceph_authorizer; 263d14c5d2SYehuda Sadeh 273d14c5d2SYehuda Sadeh /* 283d14c5d2SYehuda Sadeh * completion callback for async writepages 293d14c5d2SYehuda Sadeh */ 303d14c5d2SYehuda Sadeh typedef void (*ceph_osdc_callback_t)(struct ceph_osd_request *, 313d14c5d2SYehuda Sadeh struct ceph_msg *); 323d14c5d2SYehuda Sadeh 333d14c5d2SYehuda Sadeh /* a given osd we're communicating with */ 343d14c5d2SYehuda Sadeh struct ceph_osd { 353d14c5d2SYehuda Sadeh atomic_t o_ref; 363d14c5d2SYehuda Sadeh struct ceph_osd_client *o_osdc; 373d14c5d2SYehuda Sadeh int o_osd; 383d14c5d2SYehuda Sadeh int o_incarnation; 393d14c5d2SYehuda Sadeh struct rb_node o_node; 403d14c5d2SYehuda Sadeh struct ceph_connection o_con; 413d14c5d2SYehuda Sadeh struct list_head o_requests; 42a40c4f10SYehuda Sadeh struct list_head o_linger_requests; 433d14c5d2SYehuda Sadeh struct list_head o_osd_lru; 446c4a1915SAlex Elder struct ceph_auth_handshake o_auth; 453d14c5d2SYehuda Sadeh unsigned long lru_ttl; 463d14c5d2SYehuda Sadeh int o_marked_for_keepalive; 473d14c5d2SYehuda Sadeh struct list_head o_keepalive_item; 483d14c5d2SYehuda Sadeh }; 493d14c5d2SYehuda Sadeh 501b83bef2SSage Weil 511b83bef2SSage Weil #define CEPH_OSD_MAX_OP 10 521b83bef2SSage Weil 532ac2b7a6SAlex Elder enum ceph_osd_data_type { 542ac2b7a6SAlex Elder CEPH_OSD_DATA_TYPE_NONE, 552ac2b7a6SAlex Elder CEPH_OSD_DATA_TYPE_PAGES, 569a5e6d09SAlex Elder CEPH_OSD_DATA_TYPE_PAGELIST, 572ac2b7a6SAlex Elder #ifdef CONFIG_BLOCK 582ac2b7a6SAlex Elder CEPH_OSD_DATA_TYPE_BIO, 592ac2b7a6SAlex Elder #endif /* CONFIG_BLOCK */ 602ac2b7a6SAlex Elder }; 612ac2b7a6SAlex Elder 622794a82aSAlex Elder struct ceph_osd_data { 632ac2b7a6SAlex Elder enum ceph_osd_data_type type; 642ac2b7a6SAlex Elder union { 652794a82aSAlex Elder struct { 662794a82aSAlex Elder struct page **pages; 67e0c59487SAlex Elder u64 length; 682794a82aSAlex Elder u32 alignment; 692794a82aSAlex Elder bool pages_from_pool; 702794a82aSAlex Elder bool own_pages; 712794a82aSAlex Elder }; 729a5e6d09SAlex Elder struct ceph_pagelist *pagelist; 732794a82aSAlex Elder #ifdef CONFIG_BLOCK 74fdce58ccSAlex Elder struct { 75fdce58ccSAlex Elder struct bio *bio; /* list of bios */ 76fdce58ccSAlex Elder size_t bio_length; /* total in list */ 77fdce58ccSAlex Elder }; 782794a82aSAlex Elder #endif /* CONFIG_BLOCK */ 792794a82aSAlex Elder }; 802794a82aSAlex Elder }; 812794a82aSAlex Elder 823d14c5d2SYehuda Sadeh /* an in-flight request */ 833d14c5d2SYehuda Sadeh struct ceph_osd_request { 843d14c5d2SYehuda Sadeh u64 r_tid; /* unique for this client */ 853d14c5d2SYehuda Sadeh struct rb_node r_node; 863d14c5d2SYehuda Sadeh struct list_head r_req_lru_item; 873d14c5d2SYehuda Sadeh struct list_head r_osd_item; 88a40c4f10SYehuda Sadeh struct list_head r_linger_item; 89a40c4f10SYehuda Sadeh struct list_head r_linger_osd; 903d14c5d2SYehuda Sadeh struct ceph_osd *r_osd; 915b191d99SSage Weil struct ceph_pg r_pgid; 923d14c5d2SYehuda Sadeh int r_pg_osds[CEPH_PG_MAX_SIZE]; 933d14c5d2SYehuda Sadeh int r_num_pg_osds; 943d14c5d2SYehuda Sadeh 953d14c5d2SYehuda Sadeh struct ceph_msg *r_request, *r_reply; 963d14c5d2SYehuda Sadeh int r_flags; /* any additional flags for the osd */ 973d14c5d2SYehuda Sadeh u32 r_sent; /* >0 if r_request is sending/sent */ 981b83bef2SSage Weil int r_num_ops; 991b83bef2SSage Weil 1001b83bef2SSage Weil /* encoded message content */ 1011b83bef2SSage Weil struct ceph_osd_op *r_request_ops; 1021b83bef2SSage Weil /* these are updated on each send */ 1031b83bef2SSage Weil __le32 *r_request_osdmap_epoch; 1041b83bef2SSage Weil __le32 *r_request_flags; 1051b83bef2SSage Weil __le64 *r_request_pool; 1061b83bef2SSage Weil void *r_request_pgid; 1071b83bef2SSage Weil __le32 *r_request_attempts; 1081b83bef2SSage Weil struct ceph_eversion *r_request_reassert_version; 1091b83bef2SSage Weil 1101b83bef2SSage Weil int r_result; 1111b83bef2SSage Weil int r_reply_op_len[CEPH_OSD_MAX_OP]; 1121b83bef2SSage Weil s32 r_reply_op_result[CEPH_OSD_MAX_OP]; 1133d14c5d2SYehuda Sadeh int r_got_reply; 114a40c4f10SYehuda Sadeh int r_linger; 1150d5af164SAlex Elder int r_completed; 1163d14c5d2SYehuda Sadeh 1173d14c5d2SYehuda Sadeh struct ceph_osd_client *r_osdc; 1183d14c5d2SYehuda Sadeh struct kref r_kref; 1193d14c5d2SYehuda Sadeh bool r_mempool; 1203d14c5d2SYehuda Sadeh struct completion r_completion, r_safe_completion; 1213d14c5d2SYehuda Sadeh ceph_osdc_callback_t r_callback, r_safe_callback; 1223d14c5d2SYehuda Sadeh struct ceph_eversion r_reassert_version; 1233d14c5d2SYehuda Sadeh struct list_head r_unsafe_item; 1243d14c5d2SYehuda Sadeh 1253d14c5d2SYehuda Sadeh struct inode *r_inode; /* for use by callbacks */ 1263d14c5d2SYehuda Sadeh void *r_priv; /* ditto */ 1273d14c5d2SYehuda Sadeh 128224736d9SStratos Psomadakis char r_oid[MAX_OBJ_NAME_SIZE]; /* object name */ 1293d14c5d2SYehuda Sadeh int r_oid_len; 1302169aea6SSage Weil u64 r_snapid; 1313d14c5d2SYehuda Sadeh unsigned long r_stamp; /* send OR check time */ 1323d14c5d2SYehuda Sadeh 1333d14c5d2SYehuda Sadeh struct ceph_file_layout r_file_layout; 1343d14c5d2SYehuda Sadeh struct ceph_snap_context *r_snapc; /* snap context for writes */ 1353d14c5d2SYehuda Sadeh 1360fff87ecSAlex Elder struct ceph_osd_data r_data_in; 1370fff87ecSAlex Elder struct ceph_osd_data r_data_out; 1383d14c5d2SYehuda Sadeh }; 1393d14c5d2SYehuda Sadeh 140a40c4f10SYehuda Sadeh struct ceph_osd_event { 141a40c4f10SYehuda Sadeh u64 cookie; 142a40c4f10SYehuda Sadeh int one_shot; 143a40c4f10SYehuda Sadeh struct ceph_osd_client *osdc; 144a40c4f10SYehuda Sadeh void (*cb)(u64, u64, u8, void *); 145a40c4f10SYehuda Sadeh void *data; 146a40c4f10SYehuda Sadeh struct rb_node node; 147a40c4f10SYehuda Sadeh struct list_head osd_node; 148a40c4f10SYehuda Sadeh struct kref kref; 149a40c4f10SYehuda Sadeh }; 150a40c4f10SYehuda Sadeh 151a40c4f10SYehuda Sadeh struct ceph_osd_event_work { 152a40c4f10SYehuda Sadeh struct work_struct work; 153a40c4f10SYehuda Sadeh struct ceph_osd_event *event; 154a40c4f10SYehuda Sadeh u64 ver; 155a40c4f10SYehuda Sadeh u64 notify_id; 156a40c4f10SYehuda Sadeh u8 opcode; 157a40c4f10SYehuda Sadeh }; 158a40c4f10SYehuda Sadeh 1593d14c5d2SYehuda Sadeh struct ceph_osd_client { 1603d14c5d2SYehuda Sadeh struct ceph_client *client; 1613d14c5d2SYehuda Sadeh 1623d14c5d2SYehuda Sadeh struct ceph_osdmap *osdmap; /* current map */ 1633d14c5d2SYehuda Sadeh struct rw_semaphore map_sem; 1643d14c5d2SYehuda Sadeh struct completion map_waiters; 1653d14c5d2SYehuda Sadeh u64 last_requested_map; 1663d14c5d2SYehuda Sadeh 1673d14c5d2SYehuda Sadeh struct mutex request_mutex; 1683d14c5d2SYehuda Sadeh struct rb_root osds; /* osds */ 1693d14c5d2SYehuda Sadeh struct list_head osd_lru; /* idle osds */ 1703d14c5d2SYehuda Sadeh u64 timeout_tid; /* tid of timeout triggering rq */ 1713d14c5d2SYehuda Sadeh u64 last_tid; /* tid of last request */ 1723d14c5d2SYehuda Sadeh struct rb_root requests; /* pending requests */ 1736f6c7006SSage Weil struct list_head req_lru; /* in-flight lru */ 1746f6c7006SSage Weil struct list_head req_unsent; /* unsent/need-resend queue */ 1756f6c7006SSage Weil struct list_head req_notarget; /* map to no osd */ 176a40c4f10SYehuda Sadeh struct list_head req_linger; /* lingering requests */ 1773d14c5d2SYehuda Sadeh int num_requests; 1783d14c5d2SYehuda Sadeh struct delayed_work timeout_work; 1793d14c5d2SYehuda Sadeh struct delayed_work osds_timeout_work; 1803d14c5d2SYehuda Sadeh #ifdef CONFIG_DEBUG_FS 1813d14c5d2SYehuda Sadeh struct dentry *debugfs_file; 1823d14c5d2SYehuda Sadeh #endif 1833d14c5d2SYehuda Sadeh 1843d14c5d2SYehuda Sadeh mempool_t *req_mempool; 1853d14c5d2SYehuda Sadeh 1863d14c5d2SYehuda Sadeh struct ceph_msgpool msgpool_op; 1873d14c5d2SYehuda Sadeh struct ceph_msgpool msgpool_op_reply; 188a40c4f10SYehuda Sadeh 189a40c4f10SYehuda Sadeh spinlock_t event_lock; 190a40c4f10SYehuda Sadeh struct rb_root event_tree; 191a40c4f10SYehuda Sadeh u64 event_count; 192a40c4f10SYehuda Sadeh 193a40c4f10SYehuda Sadeh struct workqueue_struct *notify_wq; 1943d14c5d2SYehuda Sadeh }; 1953d14c5d2SYehuda Sadeh 1963d14c5d2SYehuda Sadeh struct ceph_osd_req_op { 1973d14c5d2SYehuda Sadeh u16 op; /* CEPH_OSD_OP_* */ 198e7e319a9SAlex Elder u32 payload_len; 1993d14c5d2SYehuda Sadeh union { 2003d14c5d2SYehuda Sadeh struct { 2013d14c5d2SYehuda Sadeh u64 offset, length; 2023d14c5d2SYehuda Sadeh u64 truncate_size; 2033d14c5d2SYehuda Sadeh u32 truncate_seq; 2043d14c5d2SYehuda Sadeh } extent; 2053d14c5d2SYehuda Sadeh struct { 2063d14c5d2SYehuda Sadeh const char *class_name; 2073d14c5d2SYehuda Sadeh const char *method_name; 2082a24d1f4SAlex Elder const void *indata; 2093d14c5d2SYehuda Sadeh u32 indata_len; 210e7e319a9SAlex Elder __u8 class_len; 211e7e319a9SAlex Elder __u8 method_len; 212e7e319a9SAlex Elder __u8 argc; 2133d14c5d2SYehuda Sadeh } cls; 2143d14c5d2SYehuda Sadeh struct { 215e7e319a9SAlex Elder u64 cookie; 216a40c4f10SYehuda Sadeh u64 ver; 217a40c4f10SYehuda Sadeh u32 prot_ver; 218a40c4f10SYehuda Sadeh u32 timeout; 219e7e319a9SAlex Elder __u8 flag; 220a40c4f10SYehuda Sadeh } watch; 2213d14c5d2SYehuda Sadeh }; 2223d14c5d2SYehuda Sadeh }; 2233d14c5d2SYehuda Sadeh 2243d14c5d2SYehuda Sadeh extern int ceph_osdc_init(struct ceph_osd_client *osdc, 2253d14c5d2SYehuda Sadeh struct ceph_client *client); 2263d14c5d2SYehuda Sadeh extern void ceph_osdc_stop(struct ceph_osd_client *osdc); 2273d14c5d2SYehuda Sadeh 2283d14c5d2SYehuda Sadeh extern void ceph_osdc_handle_reply(struct ceph_osd_client *osdc, 2293d14c5d2SYehuda Sadeh struct ceph_msg *msg); 2303d14c5d2SYehuda Sadeh extern void ceph_osdc_handle_map(struct ceph_osd_client *osdc, 2313d14c5d2SYehuda Sadeh struct ceph_msg *msg); 2323d14c5d2SYehuda Sadeh 23333803f33SAlex Elder extern void osd_req_op_init(struct ceph_osd_req_op *op, u16 opcode); 23433803f33SAlex Elder extern void osd_req_op_extent_init(struct ceph_osd_req_op *op, u16 opcode, 23533803f33SAlex Elder u64 offset, u64 length, 23633803f33SAlex Elder u64 truncate_size, u32 truncate_seq); 23733803f33SAlex Elder extern void osd_req_op_cls_init(struct ceph_osd_req_op *op, u16 opcode, 23833803f33SAlex Elder const char *class, const char *method, 23933803f33SAlex Elder const void *request_data, 24033803f33SAlex Elder size_t request_data_size); 24133803f33SAlex Elder extern void osd_req_op_watch_init(struct ceph_osd_req_op *op, u16 opcode, 24233803f33SAlex Elder u64 cookie, u64 version, int flag); 24333803f33SAlex Elder 2443d14c5d2SYehuda Sadeh extern struct ceph_osd_request *ceph_osdc_alloc_request(struct ceph_osd_client *osdc, 2453d14c5d2SYehuda Sadeh struct ceph_snap_context *snapc, 246acead002SAlex Elder unsigned int num_ops, 2473d14c5d2SYehuda Sadeh bool use_mempool, 24854a54007SAlex Elder gfp_t gfp_flags); 2493d14c5d2SYehuda Sadeh 250175face2SAlex Elder extern void ceph_osdc_build_request(struct ceph_osd_request *req, u64 off, 251acead002SAlex Elder unsigned int num_ops, 2523d14c5d2SYehuda Sadeh struct ceph_osd_req_op *src_ops, 2533d14c5d2SYehuda Sadeh struct ceph_snap_context *snapc, 2544d6b250bSAlex Elder u64 snap_id, 255af77f26cSAlex Elder struct timespec *mtime); 2563d14c5d2SYehuda Sadeh 2573d14c5d2SYehuda Sadeh extern struct ceph_osd_request *ceph_osdc_new_request(struct ceph_osd_client *, 2583d14c5d2SYehuda Sadeh struct ceph_file_layout *layout, 2593d14c5d2SYehuda Sadeh struct ceph_vino vino, 260acead002SAlex Elder u64 offset, u64 *len, 261acead002SAlex Elder int num_ops, struct ceph_osd_req_op *ops, 262acead002SAlex Elder int opcode, int flags, 2633d14c5d2SYehuda Sadeh struct ceph_snap_context *snapc, 264acead002SAlex Elder u32 truncate_seq, u64 truncate_size, 265153e5167SAlex Elder bool use_mempool); 2663d14c5d2SYehuda Sadeh 267a40c4f10SYehuda Sadeh extern void ceph_osdc_set_request_linger(struct ceph_osd_client *osdc, 268a40c4f10SYehuda Sadeh struct ceph_osd_request *req); 269a40c4f10SYehuda Sadeh extern void ceph_osdc_unregister_linger_request(struct ceph_osd_client *osdc, 270a40c4f10SYehuda Sadeh struct ceph_osd_request *req); 271a40c4f10SYehuda Sadeh 2723d14c5d2SYehuda Sadeh static inline void ceph_osdc_get_request(struct ceph_osd_request *req) 2733d14c5d2SYehuda Sadeh { 2743d14c5d2SYehuda Sadeh kref_get(&req->r_kref); 2753d14c5d2SYehuda Sadeh } 2763d14c5d2SYehuda Sadeh extern void ceph_osdc_release_request(struct kref *kref); 2773d14c5d2SYehuda Sadeh static inline void ceph_osdc_put_request(struct ceph_osd_request *req) 2783d14c5d2SYehuda Sadeh { 2793d14c5d2SYehuda Sadeh kref_put(&req->r_kref, ceph_osdc_release_request); 2803d14c5d2SYehuda Sadeh } 2813d14c5d2SYehuda Sadeh 2823d14c5d2SYehuda Sadeh extern int ceph_osdc_start_request(struct ceph_osd_client *osdc, 2833d14c5d2SYehuda Sadeh struct ceph_osd_request *req, 2843d14c5d2SYehuda Sadeh bool nofail); 2853d14c5d2SYehuda Sadeh extern int ceph_osdc_wait_request(struct ceph_osd_client *osdc, 2863d14c5d2SYehuda Sadeh struct ceph_osd_request *req); 2873d14c5d2SYehuda Sadeh extern void ceph_osdc_sync(struct ceph_osd_client *osdc); 2883d14c5d2SYehuda Sadeh 2893d14c5d2SYehuda Sadeh extern int ceph_osdc_readpages(struct ceph_osd_client *osdc, 2903d14c5d2SYehuda Sadeh struct ceph_vino vino, 2913d14c5d2SYehuda Sadeh struct ceph_file_layout *layout, 2923d14c5d2SYehuda Sadeh u64 off, u64 *plen, 2933d14c5d2SYehuda Sadeh u32 truncate_seq, u64 truncate_size, 294b7495fc2SSage Weil struct page **pages, int nr_pages, 295b7495fc2SSage Weil int page_align); 2963d14c5d2SYehuda Sadeh 2973d14c5d2SYehuda Sadeh extern int ceph_osdc_writepages(struct ceph_osd_client *osdc, 2983d14c5d2SYehuda Sadeh struct ceph_vino vino, 2993d14c5d2SYehuda Sadeh struct ceph_file_layout *layout, 3003d14c5d2SYehuda Sadeh struct ceph_snap_context *sc, 3013d14c5d2SYehuda Sadeh u64 off, u64 len, 3023d14c5d2SYehuda Sadeh u32 truncate_seq, u64 truncate_size, 3033d14c5d2SYehuda Sadeh struct timespec *mtime, 30424808826SAlex Elder struct page **pages, int nr_pages); 3053d14c5d2SYehuda Sadeh 306a40c4f10SYehuda Sadeh /* watch/notify events */ 307a40c4f10SYehuda Sadeh extern int ceph_osdc_create_event(struct ceph_osd_client *osdc, 308a40c4f10SYehuda Sadeh void (*event_cb)(u64, u64, u8, void *), 3093c663bbdSAlex Elder void *data, struct ceph_osd_event **pevent); 310a40c4f10SYehuda Sadeh extern void ceph_osdc_cancel_event(struct ceph_osd_event *event); 311a40c4f10SYehuda Sadeh extern void ceph_osdc_put_event(struct ceph_osd_event *event); 3123d14c5d2SYehuda Sadeh #endif 3133d14c5d2SYehuda Sadeh 314