Merge branch 'next' of git://git.kernel.org/pub/scm/linux/kernel/git/rzhang/linux
[linux-2.6-block.git] / fs / ceph / ioctl.c
CommitLineData
96c57ade 1#include <linux/ceph/ceph_debug.h>
8f4e91de
SW
2#include <linux/in.h>
3
8f4e91de 4#include "super.h"
3d14c5d2 5#include "mds_client.h"
3d14c5d2 6#include "ioctl.h"
8f4e91de
SW
7
8
9/*
10 * ioctls
11 */
12
13/*
14 * get and set the file layout
15 */
16static long ceph_ioctl_get_layout(struct file *file, void __user *arg)
17{
496ad9aa 18 struct ceph_inode_info *ci = ceph_inode(file_inode(file));
8f4e91de
SW
19 struct ceph_ioctl_layout l;
20 int err;
21
508b32d8 22 err = ceph_do_getattr(file_inode(file), CEPH_STAT_CAP_LAYOUT, false);
8f4e91de 23 if (!err) {
7627151e
YZ
24 l.stripe_unit = ci->i_layout.stripe_unit;
25 l.stripe_count = ci->i_layout.stripe_count;
26 l.object_size = ci->i_layout.object_size;
27 l.data_pool = ci->i_layout.pool_id;
3469ac1a 28 l.preferred_osd = (s32)-1;
8f4e91de
SW
29 if (copy_to_user(arg, &l, sizeof(l)))
30 return -EFAULT;
31 }
32
33 return err;
34}
35
e49bf4c5
SW
36static long __validate_layout(struct ceph_mds_client *mdsc,
37 struct ceph_ioctl_layout *l)
38{
39 int i, err;
40
e49bf4c5
SW
41 /* validate striping parameters */
42 if ((l->object_size & ~PAGE_MASK) ||
43 (l->stripe_unit & ~PAGE_MASK) ||
0bc62284 44 ((unsigned)l->stripe_unit != 0 &&
45f2e081 45 ((unsigned)l->object_size % (unsigned)l->stripe_unit)))
e49bf4c5
SW
46 return -EINVAL;
47
48 /* make sure it's a valid data pool */
49 mutex_lock(&mdsc->mutex);
50 err = -EINVAL;
51 for (i = 0; i < mdsc->mdsmap->m_num_data_pg_pools; i++)
52 if (mdsc->mdsmap->m_data_pg_pools[i] == l->data_pool) {
53 err = 0;
54 break;
55 }
56 mutex_unlock(&mdsc->mutex);
57 if (err)
58 return err;
59
60 return 0;
61}
62
8f4e91de
SW
63static long ceph_ioctl_set_layout(struct file *file, void __user *arg)
64{
496ad9aa 65 struct inode *inode = file_inode(file);
3d14c5d2 66 struct ceph_mds_client *mdsc = ceph_sb_to_client(inode->i_sb)->mdsc;
8f4e91de
SW
67 struct ceph_mds_request *req;
68 struct ceph_ioctl_layout l;
496ad9aa 69 struct ceph_inode_info *ci = ceph_inode(file_inode(file));
a35eca95 70 struct ceph_ioctl_layout nl;
e49bf4c5 71 int err;
8f4e91de 72
8f4e91de
SW
73 if (copy_from_user(&l, arg, sizeof(l)))
74 return -EFAULT;
75
a35eca95 76 /* validate changed params against current layout */
508b32d8 77 err = ceph_do_getattr(file_inode(file), CEPH_STAT_CAP_LAYOUT, false);
702aeb1f 78 if (err)
a35eca95
GF
79 return err;
80
702aeb1f 81 memset(&nl, 0, sizeof(nl));
a35eca95
GF
82 if (l.stripe_count)
83 nl.stripe_count = l.stripe_count;
702aeb1f 84 else
7627151e 85 nl.stripe_count = ci->i_layout.stripe_count;
a35eca95
GF
86 if (l.stripe_unit)
87 nl.stripe_unit = l.stripe_unit;
702aeb1f 88 else
7627151e 89 nl.stripe_unit = ci->i_layout.stripe_unit;
a35eca95
GF
90 if (l.object_size)
91 nl.object_size = l.object_size;
702aeb1f 92 else
7627151e 93 nl.object_size = ci->i_layout.object_size;
a35eca95
GF
94 if (l.data_pool)
95 nl.data_pool = l.data_pool;
702aeb1f 96 else
7627151e 97 nl.data_pool = ci->i_layout.pool_id;
702aeb1f
SW
98
99 /* this is obsolete, and always -1 */
100 nl.preferred_osd = le64_to_cpu(-1);
a35eca95 101
e49bf4c5
SW
102 err = __validate_layout(mdsc, &nl);
103 if (err)
104 return err;
8f4e91de
SW
105
106 req = ceph_mdsc_create_request(mdsc, CEPH_MDS_OP_SETLAYOUT,
107 USE_AUTH_MDS);
108 if (IS_ERR(req))
109 return PTR_ERR(req);
70b666c3
SW
110 req->r_inode = inode;
111 ihold(inode);
3bd58143
YZ
112 req->r_num_caps = 1;
113
8f4e91de
SW
114 req->r_inode_drop = CEPH_CAP_FILE_SHARED | CEPH_CAP_FILE_EXCL;
115
116 req->r_args.setlayout.layout.fl_stripe_unit =
117 cpu_to_le32(l.stripe_unit);
118 req->r_args.setlayout.layout.fl_stripe_count =
119 cpu_to_le32(l.stripe_count);
120 req->r_args.setlayout.layout.fl_object_size =
121 cpu_to_le32(l.object_size);
122 req->r_args.setlayout.layout.fl_pg_pool = cpu_to_le32(l.data_pool);
8f4e91de 123
752c8bdc 124 err = ceph_mdsc_do_request(mdsc, NULL, req);
8f4e91de
SW
125 ceph_mdsc_put_request(req);
126 return err;
127}
128
571dba52
GF
129/*
130 * Set a layout policy on a directory inode. All items in the tree
131 * rooted at this inode will inherit this layout on creation,
132 * (It doesn't apply retroactively )
133 * unless a subdirectory has its own layout policy.
134 */
135static long ceph_ioctl_set_layout_policy (struct file *file, void __user *arg)
136{
496ad9aa 137 struct inode *inode = file_inode(file);
571dba52
GF
138 struct ceph_mds_request *req;
139 struct ceph_ioctl_layout l;
e49bf4c5 140 int err;
571dba52
GF
141 struct ceph_mds_client *mdsc = ceph_sb_to_client(inode->i_sb)->mdsc;
142
143 /* copy and validate */
144 if (copy_from_user(&l, arg, sizeof(l)))
145 return -EFAULT;
146
e49bf4c5
SW
147 err = __validate_layout(mdsc, &l);
148 if (err)
149 return err;
571dba52
GF
150
151 req = ceph_mdsc_create_request(mdsc, CEPH_MDS_OP_SETDIRLAYOUT,
152 USE_AUTH_MDS);
153
154 if (IS_ERR(req))
155 return PTR_ERR(req);
70b666c3
SW
156 req->r_inode = inode;
157 ihold(inode);
3bd58143 158 req->r_num_caps = 1;
571dba52
GF
159
160 req->r_args.setlayout.layout.fl_stripe_unit =
161 cpu_to_le32(l.stripe_unit);
162 req->r_args.setlayout.layout.fl_stripe_count =
163 cpu_to_le32(l.stripe_count);
164 req->r_args.setlayout.layout.fl_object_size =
165 cpu_to_le32(l.object_size);
166 req->r_args.setlayout.layout.fl_pg_pool =
167 cpu_to_le32(l.data_pool);
571dba52
GF
168
169 err = ceph_mdsc_do_request(mdsc, inode, req);
170 ceph_mdsc_put_request(req);
171 return err;
172}
173
8f4e91de
SW
174/*
175 * Return object name, size/offset information, and location (OSD
176 * number, network address) for a given file offset.
177 */
178static long ceph_ioctl_get_dataloc(struct file *file, void __user *arg)
179{
180 struct ceph_ioctl_dataloc dl;
496ad9aa 181 struct inode *inode = file_inode(file);
8f4e91de 182 struct ceph_inode_info *ci = ceph_inode(inode);
3d14c5d2
YS
183 struct ceph_osd_client *osdc =
184 &ceph_sb_to_client(inode->i_sb)->client->osdc;
7c13cb64 185 struct ceph_object_locator oloc;
281dbe5d 186 CEPH_DEFINE_OID_ONSTACK(oid);
8f4e91de
SW
187 u64 len = 1, olen;
188 u64 tmp;
51042122 189 struct ceph_pg pgid;
457712a0 190 int r;
8f4e91de
SW
191
192 /* copy and validate */
193 if (copy_from_user(&dl, arg, sizeof(dl)))
194 return -EFAULT;
195
5aea3dcd 196 down_read(&osdc->lock);
e8afad65 197 r = ceph_calc_file_object_mapping(&ci->i_layout, dl.file_offset, len,
457712a0
SW
198 &dl.object_no, &dl.object_offset,
199 &olen);
494ddd11 200 if (r < 0) {
5aea3dcd 201 up_read(&osdc->lock);
457712a0 202 return -EIO;
494ddd11 203 }
8f4e91de 204 dl.file_offset -= dl.object_offset;
7627151e
YZ
205 dl.object_size = ci->i_layout.object_size;
206 dl.block_size = ci->i_layout.stripe_unit;
8f4e91de
SW
207
208 /* block_offset = object_offset % block_size */
209 tmp = dl.object_offset;
210 dl.block_offset = do_div(tmp, dl.block_size);
211
212 snprintf(dl.object_name, sizeof(dl.object_name), "%llx.%08llx",
213 ceph_ino(inode), dl.object_no);
41766f87 214
7627151e 215 oloc.pool = ci->i_layout.pool_id;
779fe0fb 216 oloc.pool_ns = ceph_try_get_string(ci->i_layout.pool_ns);
d30291b9 217 ceph_oid_printf(&oid, "%s", dl.object_name);
7c13cb64 218
d9591f5e 219 r = ceph_object_locator_to_pg(osdc->osdmap, &oid, &oloc, &pgid);
779fe0fb
YZ
220
221 ceph_oloc_destroy(&oloc);
2fbcbff1 222 if (r < 0) {
5aea3dcd 223 up_read(&osdc->lock);
2fbcbff1 224 return r;
225 }
8f4e91de 226
f81f1633 227 dl.osd = ceph_pg_to_acting_primary(osdc->osdmap, &pgid);
8f4e91de
SW
228 if (dl.osd >= 0) {
229 struct ceph_entity_addr *a =
230 ceph_osd_addr(osdc->osdmap, dl.osd);
231 if (a)
232 memcpy(&dl.osd_addr, &a->in_addr, sizeof(dl.osd_addr));
233 } else {
234 memset(&dl.osd_addr, 0, sizeof(dl.osd_addr));
235 }
5aea3dcd 236 up_read(&osdc->lock);
8f4e91de
SW
237
238 /* send result back to user */
239 if (copy_to_user(arg, &dl, sizeof(dl)))
240 return -EFAULT;
241
242 return 0;
243}
244
8c6e9229
SW
245static long ceph_ioctl_lazyio(struct file *file)
246{
247 struct ceph_file_info *fi = file->private_data;
496ad9aa 248 struct inode *inode = file_inode(file);
8c6e9229
SW
249 struct ceph_inode_info *ci = ceph_inode(inode);
250
251 if ((fi->fmode & CEPH_FILE_MODE_LAZY) == 0) {
be655596 252 spin_lock(&ci->i_ceph_lock);
8c6e9229 253 fi->fmode |= CEPH_FILE_MODE_LAZY;
774a6a11 254 ci->i_nr_by_mode[ffs(CEPH_FILE_MODE_LAZY)]++;
be655596 255 spin_unlock(&ci->i_ceph_lock);
8c6e9229
SW
256 dout("ioctl_layzio: file %p marked lazy\n", file);
257
258 ceph_check_caps(ci, 0, NULL);
259 } else {
260 dout("ioctl_layzio: file %p already lazy\n", file);
261 }
262 return 0;
263}
264
4918b6d1
SW
265static long ceph_ioctl_syncio(struct file *file)
266{
267 struct ceph_file_info *fi = file->private_data;
268
269 fi->flags |= CEPH_F_SYNC;
270 return 0;
271}
272
8f4e91de
SW
273long ceph_ioctl(struct file *file, unsigned int cmd, unsigned long arg)
274{
275 dout("ioctl file %p cmd %u arg %lu\n", file, cmd, arg);
276 switch (cmd) {
277 case CEPH_IOC_GET_LAYOUT:
278 return ceph_ioctl_get_layout(file, (void __user *)arg);
279
280 case CEPH_IOC_SET_LAYOUT:
281 return ceph_ioctl_set_layout(file, (void __user *)arg);
282
571dba52
GF
283 case CEPH_IOC_SET_LAYOUT_POLICY:
284 return ceph_ioctl_set_layout_policy(file, (void __user *)arg);
285
8f4e91de
SW
286 case CEPH_IOC_GET_DATALOC:
287 return ceph_ioctl_get_dataloc(file, (void __user *)arg);
8c6e9229
SW
288
289 case CEPH_IOC_LAZYIO:
290 return ceph_ioctl_lazyio(file);
4918b6d1
SW
291
292 case CEPH_IOC_SYNCIO:
293 return ceph_ioctl_syncio(file);
8f4e91de 294 }
571dba52 295
8f4e91de
SW
296 return -ENOTTY;
297}