13d14c5d2SYehuda Sadeh #ifndef _FS_CEPH_OSD_CLIENT_H 23d14c5d2SYehuda Sadeh #define _FS_CEPH_OSD_CLIENT_H 33d14c5d2SYehuda Sadeh 43d14c5d2SYehuda Sadeh #include <linux/completion.h> 53d14c5d2SYehuda Sadeh #include <linux/kref.h> 63d14c5d2SYehuda Sadeh #include <linux/mempool.h> 73d14c5d2SYehuda Sadeh #include <linux/rbtree.h> 83d14c5d2SYehuda Sadeh 96c4a1915SAlex Elder #include <linux/ceph/types.h> 106c4a1915SAlex Elder #include <linux/ceph/osdmap.h> 116c4a1915SAlex Elder #include <linux/ceph/messenger.h> 126c4a1915SAlex Elder #include <linux/ceph/auth.h> 13c885837fSAlex Elder #include <linux/ceph/pagelist.h> 143d14c5d2SYehuda Sadeh 15224736d9SStratos Psomadakis /* 16224736d9SStratos Psomadakis * Maximum object name size 17224736d9SStratos Psomadakis * (must be at least as big as RBD_MAX_MD_NAME_LEN -- currently 100) 18224736d9SStratos Psomadakis */ 19224736d9SStratos Psomadakis #define MAX_OBJ_NAME_SIZE 100 20224736d9SStratos Psomadakis 213d14c5d2SYehuda Sadeh struct ceph_msg; 223d14c5d2SYehuda Sadeh struct ceph_snap_context; 233d14c5d2SYehuda Sadeh struct ceph_osd_request; 243d14c5d2SYehuda Sadeh struct ceph_osd_client; 253d14c5d2SYehuda Sadeh struct ceph_authorizer; 263d14c5d2SYehuda Sadeh 273d14c5d2SYehuda Sadeh /* 283d14c5d2SYehuda Sadeh * completion callback for async writepages 293d14c5d2SYehuda Sadeh */ 303d14c5d2SYehuda Sadeh typedef void (*ceph_osdc_callback_t)(struct ceph_osd_request *, 313d14c5d2SYehuda Sadeh struct ceph_msg *); 323d14c5d2SYehuda Sadeh 333d14c5d2SYehuda Sadeh /* a given osd we're communicating with */ 343d14c5d2SYehuda Sadeh struct ceph_osd { 353d14c5d2SYehuda Sadeh atomic_t o_ref; 363d14c5d2SYehuda Sadeh struct ceph_osd_client *o_osdc; 373d14c5d2SYehuda Sadeh int o_osd; 383d14c5d2SYehuda Sadeh int o_incarnation; 393d14c5d2SYehuda Sadeh struct rb_node o_node; 403d14c5d2SYehuda Sadeh struct ceph_connection o_con; 413d14c5d2SYehuda Sadeh struct list_head o_requests; 42a40c4f10SYehuda Sadeh struct list_head o_linger_requests; 433d14c5d2SYehuda Sadeh struct list_head o_osd_lru; 446c4a1915SAlex Elder struct ceph_auth_handshake o_auth; 453d14c5d2SYehuda Sadeh unsigned long lru_ttl; 463d14c5d2SYehuda Sadeh int o_marked_for_keepalive; 473d14c5d2SYehuda Sadeh struct list_head o_keepalive_item; 483d14c5d2SYehuda Sadeh }; 493d14c5d2SYehuda Sadeh 501b83bef2SSage Weil 511b83bef2SSage Weil #define CEPH_OSD_MAX_OP 10 521b83bef2SSage Weil 532ac2b7a6SAlex Elder enum ceph_osd_data_type { 542ac2b7a6SAlex Elder CEPH_OSD_DATA_TYPE_NONE, 552ac2b7a6SAlex Elder CEPH_OSD_DATA_TYPE_PAGES, 562ac2b7a6SAlex Elder #ifdef CONFIG_BLOCK 572ac2b7a6SAlex Elder CEPH_OSD_DATA_TYPE_BIO, 582ac2b7a6SAlex Elder #endif /* CONFIG_BLOCK */ 592ac2b7a6SAlex Elder }; 602ac2b7a6SAlex Elder 612794a82aSAlex Elder struct ceph_osd_data { 622ac2b7a6SAlex Elder enum ceph_osd_data_type type; 632ac2b7a6SAlex Elder union { 642794a82aSAlex Elder struct { 652794a82aSAlex Elder struct page **pages; 66e0c59487SAlex Elder u64 length; 672794a82aSAlex Elder u32 alignment; 682794a82aSAlex Elder bool pages_from_pool; 692794a82aSAlex Elder bool own_pages; 702794a82aSAlex Elder }; 712794a82aSAlex Elder #ifdef CONFIG_BLOCK 722794a82aSAlex Elder struct bio *bio; 732794a82aSAlex Elder #endif /* CONFIG_BLOCK */ 742794a82aSAlex Elder }; 752794a82aSAlex Elder }; 762794a82aSAlex Elder 773d14c5d2SYehuda Sadeh /* an in-flight request */ 783d14c5d2SYehuda Sadeh struct ceph_osd_request { 793d14c5d2SYehuda Sadeh u64 r_tid; /* unique for this client */ 803d14c5d2SYehuda Sadeh struct rb_node r_node; 813d14c5d2SYehuda Sadeh struct list_head r_req_lru_item; 823d14c5d2SYehuda Sadeh struct list_head r_osd_item; 83a40c4f10SYehuda Sadeh struct list_head r_linger_item; 84a40c4f10SYehuda Sadeh struct list_head r_linger_osd; 853d14c5d2SYehuda Sadeh struct ceph_osd *r_osd; 865b191d99SSage Weil struct ceph_pg r_pgid; 873d14c5d2SYehuda Sadeh int r_pg_osds[CEPH_PG_MAX_SIZE]; 883d14c5d2SYehuda Sadeh int r_num_pg_osds; 893d14c5d2SYehuda Sadeh 903d14c5d2SYehuda Sadeh struct ceph_connection *r_con_filling_msg; 913d14c5d2SYehuda Sadeh 923d14c5d2SYehuda Sadeh struct ceph_msg *r_request, *r_reply; 933d14c5d2SYehuda Sadeh int r_flags; /* any additional flags for the osd */ 943d14c5d2SYehuda Sadeh u32 r_sent; /* >0 if r_request is sending/sent */ 951b83bef2SSage Weil int r_num_ops; 961b83bef2SSage Weil 971b83bef2SSage Weil /* encoded message content */ 981b83bef2SSage Weil struct ceph_osd_op *r_request_ops; 991b83bef2SSage Weil /* these are updated on each send */ 1001b83bef2SSage Weil __le32 *r_request_osdmap_epoch; 1011b83bef2SSage Weil __le32 *r_request_flags; 1021b83bef2SSage Weil __le64 *r_request_pool; 1031b83bef2SSage Weil void *r_request_pgid; 1041b83bef2SSage Weil __le32 *r_request_attempts; 1051b83bef2SSage Weil struct ceph_eversion *r_request_reassert_version; 1061b83bef2SSage Weil 1071b83bef2SSage Weil int r_result; 1081b83bef2SSage Weil int r_reply_op_len[CEPH_OSD_MAX_OP]; 1091b83bef2SSage Weil s32 r_reply_op_result[CEPH_OSD_MAX_OP]; 1103d14c5d2SYehuda Sadeh int r_got_reply; 111a40c4f10SYehuda Sadeh int r_linger; 1120d5af164SAlex Elder int r_completed; 1133d14c5d2SYehuda Sadeh 1143d14c5d2SYehuda Sadeh struct ceph_osd_client *r_osdc; 1153d14c5d2SYehuda Sadeh struct kref r_kref; 1163d14c5d2SYehuda Sadeh bool r_mempool; 1173d14c5d2SYehuda Sadeh struct completion r_completion, r_safe_completion; 1183d14c5d2SYehuda Sadeh ceph_osdc_callback_t r_callback, r_safe_callback; 1193d14c5d2SYehuda Sadeh struct ceph_eversion r_reassert_version; 1203d14c5d2SYehuda Sadeh struct list_head r_unsafe_item; 1213d14c5d2SYehuda Sadeh 1223d14c5d2SYehuda Sadeh struct inode *r_inode; /* for use by callbacks */ 1233d14c5d2SYehuda Sadeh void *r_priv; /* ditto */ 1243d14c5d2SYehuda Sadeh 125224736d9SStratos Psomadakis char r_oid[MAX_OBJ_NAME_SIZE]; /* object name */ 1263d14c5d2SYehuda Sadeh int r_oid_len; 1272169aea6SSage Weil u64 r_snapid; 1283d14c5d2SYehuda Sadeh unsigned long r_stamp; /* send OR check time */ 1293d14c5d2SYehuda Sadeh 1303d14c5d2SYehuda Sadeh struct ceph_file_layout r_file_layout; 1313d14c5d2SYehuda Sadeh struct ceph_snap_context *r_snapc; /* snap context for writes */ 1323d14c5d2SYehuda Sadeh 1330fff87ecSAlex Elder struct ceph_osd_data r_data_in; 1340fff87ecSAlex Elder struct ceph_osd_data r_data_out; 1350fff87ecSAlex Elder struct ceph_pagelist r_trail; /* trailing part of data out */ 1363d14c5d2SYehuda Sadeh }; 1373d14c5d2SYehuda Sadeh 138a40c4f10SYehuda Sadeh struct ceph_osd_event { 139a40c4f10SYehuda Sadeh u64 cookie; 140a40c4f10SYehuda Sadeh int one_shot; 141a40c4f10SYehuda Sadeh struct ceph_osd_client *osdc; 142a40c4f10SYehuda Sadeh void (*cb)(u64, u64, u8, void *); 143a40c4f10SYehuda Sadeh void *data; 144a40c4f10SYehuda Sadeh struct rb_node node; 145a40c4f10SYehuda Sadeh struct list_head osd_node; 146a40c4f10SYehuda Sadeh struct kref kref; 147a40c4f10SYehuda Sadeh }; 148a40c4f10SYehuda Sadeh 149a40c4f10SYehuda Sadeh struct ceph_osd_event_work { 150a40c4f10SYehuda Sadeh struct work_struct work; 151a40c4f10SYehuda Sadeh struct ceph_osd_event *event; 152a40c4f10SYehuda Sadeh u64 ver; 153a40c4f10SYehuda Sadeh u64 notify_id; 154a40c4f10SYehuda Sadeh u8 opcode; 155a40c4f10SYehuda Sadeh }; 156a40c4f10SYehuda Sadeh 1573d14c5d2SYehuda Sadeh struct ceph_osd_client { 1583d14c5d2SYehuda Sadeh struct ceph_client *client; 1593d14c5d2SYehuda Sadeh 1603d14c5d2SYehuda Sadeh struct ceph_osdmap *osdmap; /* current map */ 1613d14c5d2SYehuda Sadeh struct rw_semaphore map_sem; 1623d14c5d2SYehuda Sadeh struct completion map_waiters; 1633d14c5d2SYehuda Sadeh u64 last_requested_map; 1643d14c5d2SYehuda Sadeh 1653d14c5d2SYehuda Sadeh struct mutex request_mutex; 1663d14c5d2SYehuda Sadeh struct rb_root osds; /* osds */ 1673d14c5d2SYehuda Sadeh struct list_head osd_lru; /* idle osds */ 1683d14c5d2SYehuda Sadeh u64 timeout_tid; /* tid of timeout triggering rq */ 1693d14c5d2SYehuda Sadeh u64 last_tid; /* tid of last request */ 1703d14c5d2SYehuda Sadeh struct rb_root requests; /* pending requests */ 1716f6c7006SSage Weil struct list_head req_lru; /* in-flight lru */ 1726f6c7006SSage Weil struct list_head req_unsent; /* unsent/need-resend queue */ 1736f6c7006SSage Weil struct list_head req_notarget; /* map to no osd */ 174a40c4f10SYehuda Sadeh struct list_head req_linger; /* lingering requests */ 1753d14c5d2SYehuda Sadeh int num_requests; 1763d14c5d2SYehuda Sadeh struct delayed_work timeout_work; 1773d14c5d2SYehuda Sadeh struct delayed_work osds_timeout_work; 1783d14c5d2SYehuda Sadeh #ifdef CONFIG_DEBUG_FS 1793d14c5d2SYehuda Sadeh struct dentry *debugfs_file; 1803d14c5d2SYehuda Sadeh #endif 1813d14c5d2SYehuda Sadeh 1823d14c5d2SYehuda Sadeh mempool_t *req_mempool; 1833d14c5d2SYehuda Sadeh 1843d14c5d2SYehuda Sadeh struct ceph_msgpool msgpool_op; 1853d14c5d2SYehuda Sadeh struct ceph_msgpool msgpool_op_reply; 186a40c4f10SYehuda Sadeh 187a40c4f10SYehuda Sadeh spinlock_t event_lock; 188a40c4f10SYehuda Sadeh struct rb_root event_tree; 189a40c4f10SYehuda Sadeh u64 event_count; 190a40c4f10SYehuda Sadeh 191a40c4f10SYehuda Sadeh struct workqueue_struct *notify_wq; 1923d14c5d2SYehuda Sadeh }; 1933d14c5d2SYehuda Sadeh 1943d14c5d2SYehuda Sadeh struct ceph_osd_req_op { 1953d14c5d2SYehuda Sadeh u16 op; /* CEPH_OSD_OP_* */ 196e7e319a9SAlex Elder u32 payload_len; 1973d14c5d2SYehuda Sadeh union { 1983d14c5d2SYehuda Sadeh struct { 1993d14c5d2SYehuda Sadeh u64 offset, length; 2003d14c5d2SYehuda Sadeh u64 truncate_size; 2013d14c5d2SYehuda Sadeh u32 truncate_seq; 2023d14c5d2SYehuda Sadeh } extent; 2033d14c5d2SYehuda Sadeh struct { 2043d14c5d2SYehuda Sadeh const char *name; 2052a24d1f4SAlex Elder const void *val; 206e7e319a9SAlex Elder u32 name_len; 2073d14c5d2SYehuda Sadeh u32 value_len; 2083d14c5d2SYehuda Sadeh __u8 cmp_op; /* CEPH_OSD_CMPXATTR_OP_* */ 2093d14c5d2SYehuda Sadeh __u8 cmp_mode; /* CEPH_OSD_CMPXATTR_MODE_* */ 2103d14c5d2SYehuda Sadeh } xattr; 2113d14c5d2SYehuda Sadeh struct { 2123d14c5d2SYehuda Sadeh const char *class_name; 2133d14c5d2SYehuda Sadeh const char *method_name; 2142a24d1f4SAlex Elder const void *indata; 2153d14c5d2SYehuda Sadeh u32 indata_len; 216e7e319a9SAlex Elder __u8 class_len; 217e7e319a9SAlex Elder __u8 method_len; 218e7e319a9SAlex Elder __u8 argc; 2193d14c5d2SYehuda Sadeh } cls; 2203d14c5d2SYehuda Sadeh struct { 221e7e319a9SAlex Elder u64 cookie; 222e7e319a9SAlex Elder u64 count; 2233d14c5d2SYehuda Sadeh } pgls; 2243d14c5d2SYehuda Sadeh struct { 2253d14c5d2SYehuda Sadeh u64 snapid; 2263d14c5d2SYehuda Sadeh } snap; 227a40c4f10SYehuda Sadeh struct { 228a40c4f10SYehuda Sadeh u64 cookie; 229a40c4f10SYehuda Sadeh u64 ver; 230a40c4f10SYehuda Sadeh u32 prot_ver; 231a40c4f10SYehuda Sadeh u32 timeout; 232e7e319a9SAlex Elder __u8 flag; 233a40c4f10SYehuda Sadeh } watch; 2343d14c5d2SYehuda Sadeh }; 2353d14c5d2SYehuda Sadeh }; 2363d14c5d2SYehuda Sadeh 2373d14c5d2SYehuda Sadeh extern int ceph_osdc_init(struct ceph_osd_client *osdc, 2383d14c5d2SYehuda Sadeh struct ceph_client *client); 2393d14c5d2SYehuda Sadeh extern void ceph_osdc_stop(struct ceph_osd_client *osdc); 2403d14c5d2SYehuda Sadeh 2413d14c5d2SYehuda Sadeh extern void ceph_osdc_handle_reply(struct ceph_osd_client *osdc, 2423d14c5d2SYehuda Sadeh struct ceph_msg *msg); 2433d14c5d2SYehuda Sadeh extern void ceph_osdc_handle_map(struct ceph_osd_client *osdc, 2443d14c5d2SYehuda Sadeh struct ceph_msg *msg); 2453d14c5d2SYehuda Sadeh 2463d14c5d2SYehuda Sadeh extern struct ceph_osd_request *ceph_osdc_alloc_request(struct ceph_osd_client *osdc, 2473d14c5d2SYehuda Sadeh struct ceph_snap_context *snapc, 248ae7ca4a3SAlex Elder unsigned int num_op, 2493d14c5d2SYehuda Sadeh bool use_mempool, 25054a54007SAlex Elder gfp_t gfp_flags); 2513d14c5d2SYehuda Sadeh 2523d14c5d2SYehuda Sadeh extern void ceph_osdc_build_request(struct ceph_osd_request *req, 2530120be3cSAlex Elder u64 off, u64 len, 254ae7ca4a3SAlex Elder unsigned int num_op, 2553d14c5d2SYehuda Sadeh struct ceph_osd_req_op *src_ops, 2563d14c5d2SYehuda Sadeh struct ceph_snap_context *snapc, 2574d6b250bSAlex Elder u64 snap_id, 258af77f26cSAlex Elder struct timespec *mtime); 2593d14c5d2SYehuda Sadeh 2603d14c5d2SYehuda Sadeh extern struct ceph_osd_request *ceph_osdc_new_request(struct ceph_osd_client *, 2613d14c5d2SYehuda Sadeh struct ceph_file_layout *layout, 2623d14c5d2SYehuda Sadeh struct ceph_vino vino, 2633d14c5d2SYehuda Sadeh u64 offset, u64 *len, int op, int flags, 2643d14c5d2SYehuda Sadeh struct ceph_snap_context *snapc, 2653d14c5d2SYehuda Sadeh int do_sync, u32 truncate_seq, 2663d14c5d2SYehuda Sadeh u64 truncate_size, 2673d14c5d2SYehuda Sadeh struct timespec *mtime, 268153e5167SAlex Elder bool use_mempool); 2693d14c5d2SYehuda Sadeh 270a40c4f10SYehuda Sadeh extern void ceph_osdc_set_request_linger(struct ceph_osd_client *osdc, 271a40c4f10SYehuda Sadeh struct ceph_osd_request *req); 272a40c4f10SYehuda Sadeh extern void ceph_osdc_unregister_linger_request(struct ceph_osd_client *osdc, 273a40c4f10SYehuda Sadeh struct ceph_osd_request *req); 274a40c4f10SYehuda Sadeh 2753d14c5d2SYehuda Sadeh static inline void ceph_osdc_get_request(struct ceph_osd_request *req) 2763d14c5d2SYehuda Sadeh { 2773d14c5d2SYehuda Sadeh kref_get(&req->r_kref); 2783d14c5d2SYehuda Sadeh } 2793d14c5d2SYehuda Sadeh extern void ceph_osdc_release_request(struct kref *kref); 2803d14c5d2SYehuda Sadeh static inline void ceph_osdc_put_request(struct ceph_osd_request *req) 2813d14c5d2SYehuda Sadeh { 2823d14c5d2SYehuda Sadeh kref_put(&req->r_kref, ceph_osdc_release_request); 2833d14c5d2SYehuda Sadeh } 2843d14c5d2SYehuda Sadeh 2853d14c5d2SYehuda Sadeh extern int ceph_osdc_start_request(struct ceph_osd_client *osdc, 2863d14c5d2SYehuda Sadeh struct ceph_osd_request *req, 2873d14c5d2SYehuda Sadeh bool nofail); 2883d14c5d2SYehuda Sadeh extern int ceph_osdc_wait_request(struct ceph_osd_client *osdc, 2893d14c5d2SYehuda Sadeh struct ceph_osd_request *req); 2903d14c5d2SYehuda Sadeh extern void ceph_osdc_sync(struct ceph_osd_client *osdc); 2913d14c5d2SYehuda Sadeh 2923d14c5d2SYehuda Sadeh extern int ceph_osdc_readpages(struct ceph_osd_client *osdc, 2933d14c5d2SYehuda Sadeh struct ceph_vino vino, 2943d14c5d2SYehuda Sadeh struct ceph_file_layout *layout, 2953d14c5d2SYehuda Sadeh u64 off, u64 *plen, 2963d14c5d2SYehuda Sadeh u32 truncate_seq, u64 truncate_size, 297b7495fc2SSage Weil struct page **pages, int nr_pages, 298b7495fc2SSage Weil int page_align); 2993d14c5d2SYehuda Sadeh 3003d14c5d2SYehuda Sadeh extern int ceph_osdc_writepages(struct ceph_osd_client *osdc, 3013d14c5d2SYehuda Sadeh struct ceph_vino vino, 3023d14c5d2SYehuda Sadeh struct ceph_file_layout *layout, 3033d14c5d2SYehuda Sadeh struct ceph_snap_context *sc, 3043d14c5d2SYehuda Sadeh u64 off, u64 len, 3053d14c5d2SYehuda Sadeh u32 truncate_seq, u64 truncate_size, 3063d14c5d2SYehuda Sadeh struct timespec *mtime, 30724808826SAlex Elder struct page **pages, int nr_pages); 3083d14c5d2SYehuda Sadeh 309a40c4f10SYehuda Sadeh /* watch/notify events */ 310a40c4f10SYehuda Sadeh extern int ceph_osdc_create_event(struct ceph_osd_client *osdc, 311a40c4f10SYehuda Sadeh void (*event_cb)(u64, u64, u8, void *), 3123c663bbdSAlex Elder void *data, struct ceph_osd_event **pevent); 313a40c4f10SYehuda Sadeh extern void ceph_osdc_cancel_event(struct ceph_osd_event *event); 314a40c4f10SYehuda Sadeh extern void ceph_osdc_put_event(struct ceph_osd_event *event); 3153d14c5d2SYehuda Sadeh #endif 3163d14c5d2SYehuda Sadeh 317