2009-10-07 01:31:10 +07:00
|
|
|
#ifndef _FS_CEPH_OSD_CLIENT_H
|
|
|
|
#define _FS_CEPH_OSD_CLIENT_H
|
|
|
|
|
|
|
|
#include <linux/completion.h>
|
2009-12-08 04:37:03 +07:00
|
|
|
#include <linux/kref.h>
|
2009-10-07 01:31:10 +07:00
|
|
|
#include <linux/mempool.h>
|
|
|
|
#include <linux/rbtree.h>
|
|
|
|
|
2012-05-17 03:16:38 +07:00
|
|
|
#include <linux/ceph/types.h>
|
|
|
|
#include <linux/ceph/osdmap.h>
|
|
|
|
#include <linux/ceph/messenger.h>
|
|
|
|
#include <linux/ceph/auth.h>
|
2012-11-14 10:11:15 +07:00
|
|
|
#include <linux/ceph/pagelist.h>
|
2009-10-07 01:31:10 +07:00
|
|
|
|
2011-11-10 20:45:37 +07:00
|
|
|
/*
 * Maximum object name size
 * (must be at least as big as RBD_MAX_MD_NAME_LEN -- currently 100)
 *
 * This is the size of the r_oid[] buffer in struct ceph_osd_request.
 */
#define MAX_OBJ_NAME_SIZE 100
|
|
|
|
|
2009-10-07 01:31:10 +07:00
|
|
|
/*
 * Forward declarations: these types are only referenced through pointers
 * in the declarations that follow.
 */
struct ceph_msg;
struct ceph_snap_context;
struct ceph_osd_request;
struct ceph_osd_client;
struct ceph_authorizer;
|
2009-10-07 01:31:10 +07:00
|
|
|
|
|
|
|
/*
 * completion callback for async writepages
 *
 * The callback receives the osd request and a message pointer.  This is
 * the type of the r_callback and r_safe_callback members of
 * struct ceph_osd_request.
 */
typedef void (*ceph_osdc_callback_t)(struct ceph_osd_request *,
				     struct ceph_msg *);
|
|
|
|
|
|
|
|
/* a given osd we're communicating with */
|
|
|
|
struct ceph_osd {
|
|
|
|
atomic_t o_ref;
|
|
|
|
struct ceph_osd_client *o_osdc;
|
|
|
|
int o_osd;
|
|
|
|
int o_incarnation;
|
|
|
|
struct rb_node o_node;
|
|
|
|
struct ceph_connection o_con;
|
|
|
|
struct list_head o_requests;
|
2011-03-22 05:07:16 +07:00
|
|
|
struct list_head o_linger_requests;
|
2010-02-04 02:00:26 +07:00
|
|
|
struct list_head o_osd_lru;
|
2012-05-17 03:16:38 +07:00
|
|
|
struct ceph_auth_handshake o_auth;
|
2010-02-04 02:00:26 +07:00
|
|
|
unsigned long lru_ttl;
|
2010-02-27 06:32:31 +07:00
|
|
|
int o_marked_for_keepalive;
|
|
|
|
struct list_head o_keepalive_item;
|
2009-10-07 01:31:10 +07:00
|
|
|
};
|
|
|
|
|
2013-02-26 07:11:12 +07:00
|
|
|
|
|
|
|
/* Number of entries in the per-op reply arrays of struct ceph_osd_request */
#define CEPH_OSD_MAX_OP 10
|
|
|
|
|
2013-02-15 01:16:43 +07:00
|
|
|
/*
 * Discriminator stored in ceph_osd_data.type.  The BIO value only exists
 * when the kernel is built with CONFIG_BLOCK.
 */
enum ceph_osd_data_type {
	CEPH_OSD_DATA_TYPE_NONE,
	CEPH_OSD_DATA_TYPE_PAGES,
	CEPH_OSD_DATA_TYPE_PAGELIST,
#ifdef CONFIG_BLOCK
	CEPH_OSD_DATA_TYPE_BIO,
#endif /* CONFIG_BLOCK */
};
|
|
|
|
|
2013-02-15 01:16:43 +07:00
|
|
|
struct ceph_osd_data {
|
2013-02-15 01:16:43 +07:00
|
|
|
enum ceph_osd_data_type type;
|
|
|
|
union {
|
2013-02-15 01:16:43 +07:00
|
|
|
struct {
|
|
|
|
struct page **pages;
|
2013-03-08 04:38:25 +07:00
|
|
|
u64 length;
|
2013-02-15 01:16:43 +07:00
|
|
|
u32 alignment;
|
|
|
|
bool pages_from_pool;
|
|
|
|
bool own_pages;
|
|
|
|
};
|
2013-03-09 02:35:36 +07:00
|
|
|
struct ceph_pagelist *pagelist;
|
2013-02-15 01:16:43 +07:00
|
|
|
#ifdef CONFIG_BLOCK
|
2013-03-15 02:09:06 +07:00
|
|
|
struct {
|
|
|
|
struct bio *bio; /* list of bios */
|
|
|
|
size_t bio_length; /* total in list */
|
|
|
|
};
|
2013-02-15 01:16:43 +07:00
|
|
|
#endif /* CONFIG_BLOCK */
|
|
|
|
};
|
|
|
|
};
|
|
|
|
|
2009-10-07 01:31:10 +07:00
|
|
|
/* an in-flight request */
|
|
|
|
struct ceph_osd_request {
|
|
|
|
u64 r_tid; /* unique for this client */
|
|
|
|
struct rb_node r_node;
|
2010-02-27 06:32:31 +07:00
|
|
|
struct list_head r_req_lru_item;
|
2009-10-07 01:31:10 +07:00
|
|
|
struct list_head r_osd_item;
|
2011-03-22 05:07:16 +07:00
|
|
|
struct list_head r_linger_item;
|
|
|
|
struct list_head r_linger_osd;
|
2009-10-07 01:31:10 +07:00
|
|
|
struct ceph_osd *r_osd;
|
2013-02-24 01:38:16 +07:00
|
|
|
struct ceph_pg r_pgid;
|
2010-05-11 00:24:48 +07:00
|
|
|
int r_pg_osds[CEPH_PG_MAX_SIZE];
|
|
|
|
int r_num_pg_osds;
|
2009-10-07 01:31:10 +07:00
|
|
|
|
|
|
|
struct ceph_msg *r_request, *r_reply;
|
|
|
|
int r_flags; /* any additional flags for the osd */
|
|
|
|
u32 r_sent; /* >0 if r_request is sending/sent */
|
2013-02-26 07:11:12 +07:00
|
|
|
int r_num_ops;
|
|
|
|
|
|
|
|
/* encoded message content */
|
|
|
|
struct ceph_osd_op *r_request_ops;
|
|
|
|
/* these are updated on each send */
|
|
|
|
__le32 *r_request_osdmap_epoch;
|
|
|
|
__le32 *r_request_flags;
|
|
|
|
__le64 *r_request_pool;
|
|
|
|
void *r_request_pgid;
|
|
|
|
__le32 *r_request_attempts;
|
|
|
|
struct ceph_eversion *r_request_reassert_version;
|
|
|
|
|
|
|
|
int r_result;
|
|
|
|
int r_reply_op_len[CEPH_OSD_MAX_OP];
|
|
|
|
s32 r_reply_op_result[CEPH_OSD_MAX_OP];
|
2009-12-23 01:45:45 +07:00
|
|
|
int r_got_reply;
|
2011-03-22 05:07:16 +07:00
|
|
|
int r_linger;
|
2013-02-27 23:26:25 +07:00
|
|
|
int r_completed;
|
2009-10-07 01:31:10 +07:00
|
|
|
|
|
|
|
struct ceph_osd_client *r_osdc;
|
2009-12-08 04:37:03 +07:00
|
|
|
struct kref r_kref;
|
2009-10-07 01:31:10 +07:00
|
|
|
bool r_mempool;
|
|
|
|
struct completion r_completion, r_safe_completion;
|
|
|
|
ceph_osdc_callback_t r_callback, r_safe_callback;
|
|
|
|
struct ceph_eversion r_reassert_version;
|
|
|
|
struct list_head r_unsafe_item;
|
|
|
|
|
|
|
|
struct inode *r_inode; /* for use by callbacks */
|
2010-04-07 05:14:15 +07:00
|
|
|
void *r_priv; /* ditto */
|
2009-10-07 01:31:10 +07:00
|
|
|
|
2011-11-10 20:45:37 +07:00
|
|
|
char r_oid[MAX_OBJ_NAME_SIZE]; /* object name */
|
2009-10-07 01:31:10 +07:00
|
|
|
int r_oid_len;
|
2013-02-26 07:13:08 +07:00
|
|
|
u64 r_snapid;
|
2010-03-23 04:42:30 +07:00
|
|
|
unsigned long r_stamp; /* send OR check time */
|
2009-10-07 01:31:10 +07:00
|
|
|
|
|
|
|
struct ceph_file_layout r_file_layout;
|
|
|
|
struct ceph_snap_context *r_snapc; /* snap context for writes */
|
2010-04-07 05:01:27 +07:00
|
|
|
|
2013-02-15 01:16:43 +07:00
|
|
|
struct ceph_osd_data r_data_in;
|
|
|
|
struct ceph_osd_data r_data_out;
|
2009-10-07 01:31:10 +07:00
|
|
|
};
|
|
|
|
|
2011-03-22 05:07:16 +07:00
|
|
|
struct ceph_osd_event {
|
|
|
|
u64 cookie;
|
|
|
|
int one_shot;
|
|
|
|
struct ceph_osd_client *osdc;
|
|
|
|
void (*cb)(u64, u64, u8, void *);
|
|
|
|
void *data;
|
|
|
|
struct rb_node node;
|
|
|
|
struct list_head osd_node;
|
|
|
|
struct kref kref;
|
|
|
|
};
|
|
|
|
|
|
|
|
struct ceph_osd_event_work {
|
|
|
|
struct work_struct work;
|
|
|
|
struct ceph_osd_event *event;
|
|
|
|
u64 ver;
|
|
|
|
u64 notify_id;
|
|
|
|
u8 opcode;
|
|
|
|
};
|
|
|
|
|
2009-10-07 01:31:10 +07:00
|
|
|
struct ceph_osd_client {
|
|
|
|
struct ceph_client *client;
|
|
|
|
|
|
|
|
struct ceph_osdmap *osdmap; /* current map */
|
|
|
|
struct rw_semaphore map_sem;
|
|
|
|
struct completion map_waiters;
|
|
|
|
u64 last_requested_map;
|
|
|
|
|
|
|
|
struct mutex request_mutex;
|
|
|
|
struct rb_root osds; /* osds */
|
2010-02-04 02:00:26 +07:00
|
|
|
struct list_head osd_lru; /* idle osds */
|
2009-10-07 01:31:10 +07:00
|
|
|
u64 timeout_tid; /* tid of timeout triggering rq */
|
|
|
|
u64 last_tid; /* tid of last request */
|
|
|
|
struct rb_root requests; /* pending requests */
|
2011-01-18 11:34:08 +07:00
|
|
|
struct list_head req_lru; /* in-flight lru */
|
|
|
|
struct list_head req_unsent; /* unsent/need-resend queue */
|
|
|
|
struct list_head req_notarget; /* map to no osd */
|
2011-03-22 05:07:16 +07:00
|
|
|
struct list_head req_linger; /* lingering requests */
|
2009-10-07 01:31:10 +07:00
|
|
|
int num_requests;
|
|
|
|
struct delayed_work timeout_work;
|
2010-02-04 02:00:26 +07:00
|
|
|
struct delayed_work osds_timeout_work;
|
2009-11-13 06:05:52 +07:00
|
|
|
#ifdef CONFIG_DEBUG_FS
|
2009-10-07 01:31:10 +07:00
|
|
|
struct dentry *debugfs_file;
|
2009-11-13 06:05:52 +07:00
|
|
|
#endif
|
2009-10-07 01:31:10 +07:00
|
|
|
|
|
|
|
mempool_t *req_mempool;
|
|
|
|
|
2010-01-14 08:03:23 +07:00
|
|
|
struct ceph_msgpool msgpool_op;
|
2010-03-02 04:02:00 +07:00
|
|
|
struct ceph_msgpool msgpool_op_reply;
|
2011-03-22 05:07:16 +07:00
|
|
|
|
|
|
|
spinlock_t event_lock;
|
|
|
|
struct rb_root event_tree;
|
|
|
|
u64 event_count;
|
|
|
|
|
|
|
|
struct workqueue_struct *notify_wq;
|
2009-10-07 01:31:10 +07:00
|
|
|
};
|
|
|
|
|
2010-04-07 05:01:27 +07:00
|
|
|
struct ceph_osd_req_op {
|
|
|
|
u16 op; /* CEPH_OSD_OP_* */
|
2013-02-15 01:16:43 +07:00
|
|
|
u32 payload_len;
|
2010-04-07 05:01:27 +07:00
|
|
|
union {
|
|
|
|
struct {
|
|
|
|
u64 offset, length;
|
|
|
|
u64 truncate_size;
|
|
|
|
u32 truncate_seq;
|
|
|
|
} extent;
|
|
|
|
struct {
|
2010-05-19 06:38:08 +07:00
|
|
|
const char *class_name;
|
|
|
|
const char *method_name;
|
2013-03-02 07:00:15 +07:00
|
|
|
const void *indata;
|
2010-04-07 05:01:27 +07:00
|
|
|
u32 indata_len;
|
2013-02-15 01:16:43 +07:00
|
|
|
__u8 class_len;
|
|
|
|
__u8 method_len;
|
|
|
|
__u8 argc;
|
2010-04-07 05:01:27 +07:00
|
|
|
} cls;
|
2011-03-22 05:07:16 +07:00
|
|
|
struct {
|
|
|
|
u64 cookie;
|
|
|
|
u64 ver;
|
|
|
|
u32 prot_ver;
|
|
|
|
u32 timeout;
|
2013-02-15 01:16:43 +07:00
|
|
|
__u8 flag;
|
2011-03-22 05:07:16 +07:00
|
|
|
} watch;
|
2010-04-07 05:01:27 +07:00
|
|
|
};
|
|
|
|
};
|
|
|
|
|
2009-10-07 01:31:10 +07:00
|
|
|
/*
 * Declarations only; the definitions are not part of this header.
 * ceph_osdc_init() returns an int status.
 */
extern int ceph_osdc_init(struct ceph_osd_client *osdc,
			  struct ceph_client *client);
extern void ceph_osdc_stop(struct ceph_osd_client *osdc);
|
|
|
|
|
|
|
|
/* Incoming-message handlers; each takes the osd client and the message. */
extern void ceph_osdc_handle_reply(struct ceph_osd_client *osdc,
				   struct ceph_msg *msg);
extern void ceph_osdc_handle_map(struct ceph_osd_client *osdc,
				 struct ceph_msg *msg);
|
|
|
|
|
libceph: define source request op functions
The rbd code has a function that allocates and populates a
ceph_osd_req_op structure (the in-core version of an osd request
operation). When reviewed, Josh suggested two things: that the
big varargs function might be better split into type-specific
functions; and that this functionality really belongs in the osd
client rather than rbd.
This patch implements both of Josh's suggestions. It breaks
up the rbd function into separate functions and defines them
in the osd client module as exported interfaces. Unlike the
rbd version, however, the functions don't allocate an osd_req_op
structure; they are provided the address of one and that is
initialized instead.
The rbd function has been eliminated and calls to it have been
replaced by calls to the new routines. The rbd code now uses a
stack (struct) variable to hold the op rather than allocating and
freeing it each time.
For now only the capabilities used by rbd are implemented.
Implementing all the other osd op types, and making the rest of the
code use it will be done separately, in the next few patches.
Note that only the extent, cls, and watch portions of the
ceph_osd_req_op structure are currently used. Delete the others
(xattr, pgls, and snap) from its definition so nobody thinks it's
actually implemented or needed. We can add it back again later
if needed, when we know it's been tested.
This (and a few follow-on patches) resolves:
http://tracker.ceph.com/issues/3861
Signed-off-by: Alex Elder <elder@inktank.com>
Reviewed-by: Josh Durgin <josh.durgin@inktank.com>
2013-03-14 08:50:00 +07:00
|
|
|
extern void osd_req_op_init(struct ceph_osd_req_op *op, u16 opcode);
|
|
|
|
extern void osd_req_op_extent_init(struct ceph_osd_req_op *op, u16 opcode,
|
|
|
|
u64 offset, u64 length,
|
|
|
|
u64 truncate_size, u32 truncate_seq);
|
|
|
|
extern void osd_req_op_cls_init(struct ceph_osd_req_op *op, u16 opcode,
|
|
|
|
const char *class, const char *method,
|
|
|
|
const void *request_data,
|
|
|
|
size_t request_data_size);
|
|
|
|
extern void osd_req_op_watch_init(struct ceph_osd_req_op *op, u16 opcode,
|
|
|
|
u64 cookie, u64 version, int flag);
|
|
|
|
|
2010-04-07 04:51:47 +07:00
|
|
|
extern struct ceph_osd_request *ceph_osdc_alloc_request(struct ceph_osd_client *osdc,
|
|
|
|
struct ceph_snap_context *snapc,
|
2013-03-15 02:09:05 +07:00
|
|
|
unsigned int num_ops,
|
2010-04-07 04:51:47 +07:00
|
|
|
bool use_mempool,
|
2012-11-14 10:11:15 +07:00
|
|
|
gfp_t gfp_flags);
|
2010-04-07 04:51:47 +07:00
|
|
|
|
2013-03-09 02:35:36 +07:00
|
|
|
/*
 * Takes an existing request together with @num_ops source ops in @src_ops.
 * Declaration only; the definition is not part of this header.
 */
extern void ceph_osdc_build_request(struct ceph_osd_request *req, u64 off,
				    unsigned int num_ops,
				    struct ceph_osd_req_op *src_ops,
				    struct ceph_snap_context *snapc,
				    u64 snap_id,
				    struct timespec *mtime);
|
2010-04-07 04:51:47 +07:00
|
|
|
|
2009-10-07 01:31:10 +07:00
|
|
|
extern struct ceph_osd_request *ceph_osdc_new_request(struct ceph_osd_client *,
|
|
|
|
struct ceph_file_layout *layout,
|
|
|
|
struct ceph_vino vino,
|
2013-03-15 02:09:05 +07:00
|
|
|
u64 offset, u64 *len,
|
|
|
|
int num_ops, struct ceph_osd_req_op *ops,
|
|
|
|
int opcode, int flags,
|
2009-10-07 01:31:10 +07:00
|
|
|
struct ceph_snap_context *snapc,
|
2013-03-15 02:09:05 +07:00
|
|
|
u32 truncate_seq, u64 truncate_size,
|
libceph: don't assign page info in ceph_osdc_new_request()
Currently ceph_osdc_new_request() assigns an osd request's
r_num_pages and r_alignment fields. The only thing it does
after that is call ceph_osdc_build_request(), and that doesn't
need those fields to be assigned.
Move the assignment of those fields out of ceph_osdc_new_request()
and into its caller. As a result, the page_align parameter is no
longer used, so get rid of it.
Note that in ceph_sync_write(), the value for req->r_num_pages had
already been calculated earlier (as num_pages, and fortunately
it was computed the same way). So don't bother recomputing it,
but because it's not needed earlier, move that calculation after the
call to ceph_osdc_new_request(). Hold off making the assignment to
r_alignment, doing it instead where r_pages and r_num_pages are
getting set.
Similarly, in start_read(), nr_pages already holds the number of
pages in the array (and is calculated the same way), so there's no
need to recompute it. Move the assignment of the page alignment
down with the others there as well.
This and the next few patches are preparation work for:
http://tracker.ceph.com/issues/4127
Signed-off-by: Alex Elder <elder@inktank.com>
Reviewed-by: Josh Durgin <josh.durgin@inktank.com>
2013-03-02 07:00:15 +07:00
|
|
|
bool use_mempool);
|
2009-10-07 01:31:10 +07:00
|
|
|
|
2011-03-22 05:07:16 +07:00
|
|
|
/* Linger-request helpers; each takes the osd client and the request. */
extern void ceph_osdc_set_request_linger(struct ceph_osd_client *osdc,
					 struct ceph_osd_request *req);
extern void ceph_osdc_unregister_linger_request(struct ceph_osd_client *osdc,
						struct ceph_osd_request *req);
|
|
|
|
|
2009-10-07 01:31:10 +07:00
|
|
|
static inline void ceph_osdc_get_request(struct ceph_osd_request *req)
|
|
|
|
{
|
2009-12-08 04:37:03 +07:00
|
|
|
kref_get(&req->r_kref);
|
|
|
|
}
|
|
|
|
extern void ceph_osdc_release_request(struct kref *kref);
|
|
|
|
static inline void ceph_osdc_put_request(struct ceph_osd_request *req)
|
|
|
|
{
|
|
|
|
kref_put(&req->r_kref, ceph_osdc_release_request);
|
2009-10-07 01:31:10 +07:00
|
|
|
}
|
|
|
|
|
|
|
|
extern int ceph_osdc_start_request(struct ceph_osd_client *osdc,
|
|
|
|
struct ceph_osd_request *req,
|
|
|
|
bool nofail);
|
|
|
|
extern int ceph_osdc_wait_request(struct ceph_osd_client *osdc,
|
|
|
|
struct ceph_osd_request *req);
|
|
|
|
extern void ceph_osdc_sync(struct ceph_osd_client *osdc);
|
|
|
|
|
|
|
|
extern int ceph_osdc_readpages(struct ceph_osd_client *osdc,
|
|
|
|
struct ceph_vino vino,
|
|
|
|
struct ceph_file_layout *layout,
|
|
|
|
u64 off, u64 *plen,
|
|
|
|
u32 truncate_seq, u64 truncate_size,
|
2010-11-10 03:43:12 +07:00
|
|
|
struct page **pages, int nr_pages,
|
|
|
|
int page_align);
|
2009-10-07 01:31:10 +07:00
|
|
|
|
|
|
|
extern int ceph_osdc_writepages(struct ceph_osd_client *osdc,
|
|
|
|
struct ceph_vino vino,
|
|
|
|
struct ceph_file_layout *layout,
|
|
|
|
struct ceph_snap_context *sc,
|
|
|
|
u64 off, u64 len,
|
|
|
|
u32 truncate_seq, u64 truncate_size,
|
|
|
|
struct timespec *mtime,
|
2013-02-16 00:42:29 +07:00
|
|
|
struct page **pages, int nr_pages);
|
2009-10-07 01:31:10 +07:00
|
|
|
|
2011-03-22 05:07:16 +07:00
|
|
|
/* watch/notify events */
|
|
|
|
extern int ceph_osdc_create_event(struct ceph_osd_client *osdc,
|
|
|
|
void (*event_cb)(u64, u64, u8, void *),
|
2013-02-16 00:42:30 +07:00
|
|
|
void *data, struct ceph_osd_event **pevent);
|
2011-03-22 05:07:16 +07:00
|
|
|
extern void ceph_osdc_cancel_event(struct ceph_osd_event *event);
|
|
|
|
extern void ceph_osdc_put_event(struct ceph_osd_event *event);
|
2009-10-07 01:31:10 +07:00
|
|
|
#endif
|
|
|
|
|