osd_ore.h 5.36 KB
Newer Older
1 2
/*
 * Copyright (C) 2011
3
 * Boaz Harrosh <ooo@electrozaur.com>
4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28
 *
 * Public Declarations of the ORE API
 *
 * This file is part of the ORE (Object Raid Engine) library.
 *
 * ORE is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as published
 * by the Free Software Foundation. (GPL v2)
 *
 * ORE is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with the ORE; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
 */
#ifndef __ORE_H__
#define __ORE_H__

#include <scsi/osd_initiator.h>
#include <scsi/osd_attributes.h>
#include <scsi/osd_sec.h>
#include <linux/pnfs_osd_xdr.h>
29
#include <linux/bug.h>
30 31 32 33 34 35 36 37

struct ore_comp {
	struct osd_obj_id	obj;
	u8			cred[OSD_CAP_LEN];
};

struct ore_layout {
	/* Our way of looking at the data_map */
38 39
	enum pnfs_osd_raid_algorithm4
		 raid_algorithm;
40 41 42 43
	unsigned stripe_unit;
	unsigned mirrors_p1;

	unsigned group_width;
Boaz Harrosh's avatar
Boaz Harrosh committed
44
	unsigned parity;
45 46
	u64	 group_depth;
	unsigned group_count;
47 48 49 50 51 52 53

	/* Cached often needed calculations filled in by
	 * ore_verify_layout
	 */
	unsigned long max_io_length;	/* Max length that should be passed to
					 * ore_get_rw_state
					 */
54 55
};

56 57 58 59
struct ore_dev {
	struct osd_dev *od;
};

60
struct ore_components {
61
	unsigned	first_dev;		/* First logical device no    */
62 63 64 65 66 67 68 69
	unsigned	numdevs;		/* Num of devices in array    */
	/* If @single_comp == EC_SINGLE_COMP, @comps points to a single
	 * component. else there are @numdevs components
	 */
	enum EC_COMP_USAGE {
		EC_SINGLE_COMP = 0, EC_MULTPLE_COMPS = 0xffffffff
	}		single_comp;
	struct ore_comp	*comps;
70 71 72 73 74 75 76

	/* Array of pointers to ore_dev-* . User will usually have these pointed
	 * too a bigger struct which contain an "ore_dev ored" member and use
	 * container_of(oc->ods[i], struct foo_dev, ored) to access the bigger
	 * structure.
	 */
	struct ore_dev	**ods;
77 78
};

79 80 81 82
/* ore_comp_dev Recievies a logical device index */
static inline struct osd_dev *ore_comp_dev(
	const struct ore_components *oc, unsigned i)
{
83 84
	BUG_ON((i < oc->first_dev) || (oc->first_dev + oc->numdevs <= i));
	return oc->ods[i - oc->first_dev]->od;
85 86 87 88 89
}

static inline void ore_comp_set_dev(
	struct ore_components *oc, unsigned i, struct osd_dev *od)
{
90
	oc->ods[i - oc->first_dev]->od = od;
91 92
}

93
struct ore_striping_info {
Boaz Harrosh's avatar
Boaz Harrosh committed
94
	u64 offset;
95
	u64 obj_offset;
Boaz Harrosh's avatar
Boaz Harrosh committed
96 97
	u64 length;
	u64 first_stripe_start; /* only used in raid writes */
98
	u64 M; /* for truncate */
Boaz Harrosh's avatar
Boaz Harrosh committed
99
	unsigned bytes_in_stripe;
100
	unsigned dev;
Boaz Harrosh's avatar
Boaz Harrosh committed
101
	unsigned par_dev;
102
	unsigned unit_off;
Boaz Harrosh's avatar
Boaz Harrosh committed
103
	unsigned cur_pg;
Boaz Harrosh's avatar
Boaz Harrosh committed
104
	unsigned cur_comp;
105
	unsigned maxdevUnits;
106 107
};

108 109
struct ore_io_state;
typedef void (*ore_io_done_fn)(struct ore_io_state *ios, void *private);
Boaz Harrosh's avatar
Boaz Harrosh committed
110 111 112 113 114
struct _ore_r4w_op {
	/* @Priv given here is passed ios->private */
	struct page * (*get_page)(void *priv, u64 page_index, bool *uptodate);
	void (*put_page)(void *priv, struct page *page);
};
115 116 117

struct ore_io_state {
	struct kref		kref;
118
	struct ore_striping_info si;
119 120 121 122 123

	void			*private;
	ore_io_done_fn	done;

	struct ore_layout	*layout;
124
	struct ore_components	*oc;
125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143

	/* Global read/write IO*/
	loff_t			offset;
	unsigned long		length;
	void			*kern_buff;

	struct page		**pages;
	unsigned		nr_pages;
	unsigned		pgbase;
	unsigned		pages_consumed;

	/* Attributes */
	unsigned		in_attr_len;
	struct osd_attr		*in_attr;
	unsigned		out_attr_len;
	struct osd_attr		*out_attr;

	bool			reading;

Boaz Harrosh's avatar
Boaz Harrosh committed
144 145 146 147 148 149
	/* House keeping of Parity pages */
	bool			extra_part_alloc;
	struct page		**parity_pages;
	unsigned		max_par_pages;
	unsigned		cur_par_page;
	unsigned		sgs_per_dev;
Boaz Harrosh's avatar
Boaz Harrosh committed
150 151 152
	struct __stripe_pages_2d *sp2d;
	struct ore_io_state	 *ios_read_4_write;
	const struct _ore_r4w_op *r4w;
Boaz Harrosh's avatar
Boaz Harrosh committed
153

154 155 156 157 158 159 160
	/* Variable array of size numdevs */
	unsigned numdevs;
	struct ore_per_dev_state {
		struct osd_request *or;
		struct bio *bio;
		loff_t offset;
		unsigned length;
Boaz Harrosh's avatar
Boaz Harrosh committed
161
		unsigned last_sgs_total;
162
		unsigned dev;
Boaz Harrosh's avatar
Boaz Harrosh committed
163 164
		struct osd_sg_entry *sglist;
		unsigned cur_sg;
165 166 167 168 169 170 171 172 173 174
	} per_dev[];
};

static inline unsigned ore_io_state_size(unsigned numdevs)
{
	return sizeof(struct ore_io_state) +
		sizeof(struct ore_per_dev_state) * numdevs;
}

/* ore.c */
175
int ore_verify_layout(unsigned total_comps, struct ore_layout *layout);
176
void ore_calc_stripe_info(struct ore_layout *layout, u64 file_offset,
Boaz Harrosh's avatar
Boaz Harrosh committed
177
			  u64 length, struct ore_striping_info *si);
178 179 180 181 182 183 184
int ore_get_rw_state(struct ore_layout *layout, struct ore_components *comps,
		     bool is_reading, u64 offset, u64 length,
		     struct ore_io_state **ios);
int ore_get_io_state(struct ore_layout *layout, struct ore_components *comps,
		     struct ore_io_state **ios);
void ore_put_io_state(struct ore_io_state *ios);

185 186 187 188
typedef void (*ore_on_dev_error)(struct ore_io_state *ios, struct ore_dev *od,
	unsigned dev_index, enum osd_err_priority oep,
	u64 dev_offset, u64  dev_len);
int ore_check_io(struct ore_io_state *ios, ore_on_dev_error rep);
189 190 191 192 193 194 195 196 197 198 199 200 201

int ore_create(struct ore_io_state *ios);
int ore_remove(struct ore_io_state *ios);
int ore_write(struct ore_io_state *ios);
int ore_read(struct ore_io_state *ios);
int ore_truncate(struct ore_layout *layout, struct ore_components *comps,
		 u64 size);

int extract_attr_from_ios(struct ore_io_state *ios, struct osd_attr *attr);

extern const struct osd_attr g_attr_logical_length;

#endif