| 1 | // SPDX-License-Identifier: GPL-2.0 |
| 2 | #include <linux/ceph/ceph_debug.h> |
| 3 | #include <linux/in.h> |
| 4 | |
| 5 | #include "super.h" |
| 6 | #include "mds_client.h" |
| 7 | #include "ioctl.h" |
| 8 | #include <linux/ceph/striper.h> |
| 9 | #include <linux/fscrypt.h> |
| 10 | |
| 11 | /* |
| 12 | * ioctls |
| 13 | */ |
| 14 | |
| 15 | /* |
| 16 | * get and set the file layout |
| 17 | */ |
| 18 | static long ceph_ioctl_get_layout(struct file *file, void __user *arg) |
| 19 | { |
| 20 | struct ceph_inode_info *ci = ceph_inode(file_inode(file)); |
| 21 | struct ceph_ioctl_layout l; |
| 22 | int err; |
| 23 | |
| 24 | err = ceph_do_getattr(file_inode(file), CEPH_STAT_CAP_LAYOUT, false); |
| 25 | if (!err) { |
| 26 | l.stripe_unit = ci->i_layout.stripe_unit; |
| 27 | l.stripe_count = ci->i_layout.stripe_count; |
| 28 | l.object_size = ci->i_layout.object_size; |
| 29 | l.data_pool = ci->i_layout.pool_id; |
| 30 | l.preferred_osd = -1; |
| 31 | if (copy_to_user(arg, &l, sizeof(l))) |
| 32 | return -EFAULT; |
| 33 | } |
| 34 | |
| 35 | return err; |
| 36 | } |
| 37 | |
| 38 | static long __validate_layout(struct ceph_mds_client *mdsc, |
| 39 | struct ceph_ioctl_layout *l) |
| 40 | { |
| 41 | int i, err; |
| 42 | |
| 43 | /* validate striping parameters */ |
| 44 | if ((l->object_size & ~PAGE_MASK) || |
| 45 | (l->stripe_unit & ~PAGE_MASK) || |
| 46 | ((unsigned)l->stripe_unit != 0 && |
| 47 | ((unsigned)l->object_size % (unsigned)l->stripe_unit))) |
| 48 | return -EINVAL; |
| 49 | |
| 50 | /* make sure it's a valid data pool */ |
| 51 | mutex_lock(&mdsc->mutex); |
| 52 | err = -EINVAL; |
| 53 | for (i = 0; i < mdsc->mdsmap->m_num_data_pg_pools; i++) |
| 54 | if (mdsc->mdsmap->m_data_pg_pools[i] == l->data_pool) { |
| 55 | err = 0; |
| 56 | break; |
| 57 | } |
| 58 | mutex_unlock(&mdsc->mutex); |
| 59 | if (err) |
| 60 | return err; |
| 61 | |
| 62 | return 0; |
| 63 | } |
| 64 | |
| 65 | static long ceph_ioctl_set_layout(struct file *file, void __user *arg) |
| 66 | { |
| 67 | struct inode *inode = file_inode(file); |
| 68 | struct ceph_mds_client *mdsc = ceph_sb_to_fs_client(inode->i_sb)->mdsc; |
| 69 | struct ceph_mds_request *req; |
| 70 | struct ceph_ioctl_layout l; |
| 71 | struct ceph_inode_info *ci = ceph_inode(file_inode(file)); |
| 72 | struct ceph_ioctl_layout nl; |
| 73 | int err; |
| 74 | |
| 75 | if (copy_from_user(&l, arg, sizeof(l))) |
| 76 | return -EFAULT; |
| 77 | |
| 78 | /* validate changed params against current layout */ |
| 79 | err = ceph_do_getattr(file_inode(file), CEPH_STAT_CAP_LAYOUT, false); |
| 80 | if (err) |
| 81 | return err; |
| 82 | |
| 83 | memset(&nl, 0, sizeof(nl)); |
| 84 | if (l.stripe_count) |
| 85 | nl.stripe_count = l.stripe_count; |
| 86 | else |
| 87 | nl.stripe_count = ci->i_layout.stripe_count; |
| 88 | if (l.stripe_unit) |
| 89 | nl.stripe_unit = l.stripe_unit; |
| 90 | else |
| 91 | nl.stripe_unit = ci->i_layout.stripe_unit; |
| 92 | if (l.object_size) |
| 93 | nl.object_size = l.object_size; |
| 94 | else |
| 95 | nl.object_size = ci->i_layout.object_size; |
| 96 | if (l.data_pool) |
| 97 | nl.data_pool = l.data_pool; |
| 98 | else |
| 99 | nl.data_pool = ci->i_layout.pool_id; |
| 100 | |
| 101 | /* this is obsolete, and always -1 */ |
| 102 | nl.preferred_osd = -1; |
| 103 | |
| 104 | err = __validate_layout(mdsc, &nl); |
| 105 | if (err) |
| 106 | return err; |
| 107 | |
| 108 | req = ceph_mdsc_create_request(mdsc, CEPH_MDS_OP_SETLAYOUT, |
| 109 | USE_AUTH_MDS); |
| 110 | if (IS_ERR(req)) |
| 111 | return PTR_ERR(req); |
| 112 | req->r_inode = inode; |
| 113 | ihold(inode); |
| 114 | req->r_num_caps = 1; |
| 115 | |
| 116 | req->r_inode_drop = CEPH_CAP_FILE_SHARED | CEPH_CAP_FILE_EXCL; |
| 117 | |
| 118 | req->r_args.setlayout.layout.fl_stripe_unit = |
| 119 | cpu_to_le32(l.stripe_unit); |
| 120 | req->r_args.setlayout.layout.fl_stripe_count = |
| 121 | cpu_to_le32(l.stripe_count); |
| 122 | req->r_args.setlayout.layout.fl_object_size = |
| 123 | cpu_to_le32(l.object_size); |
| 124 | req->r_args.setlayout.layout.fl_pg_pool = cpu_to_le32(l.data_pool); |
| 125 | |
| 126 | err = ceph_mdsc_do_request(mdsc, NULL, req); |
| 127 | ceph_mdsc_put_request(req); |
| 128 | return err; |
| 129 | } |
| 130 | |
| 131 | /* |
| 132 | * Set a layout policy on a directory inode. All items in the tree |
| 133 | * rooted at this inode will inherit this layout on creation, |
| 134 | * (It doesn't apply retroactively ) |
| 135 | * unless a subdirectory has its own layout policy. |
| 136 | */ |
| 137 | static long ceph_ioctl_set_layout_policy (struct file *file, void __user *arg) |
| 138 | { |
| 139 | struct inode *inode = file_inode(file); |
| 140 | struct ceph_mds_request *req; |
| 141 | struct ceph_ioctl_layout l; |
| 142 | int err; |
| 143 | struct ceph_mds_client *mdsc = ceph_sb_to_fs_client(inode->i_sb)->mdsc; |
| 144 | |
| 145 | /* copy and validate */ |
| 146 | if (copy_from_user(&l, arg, sizeof(l))) |
| 147 | return -EFAULT; |
| 148 | |
| 149 | err = __validate_layout(mdsc, &l); |
| 150 | if (err) |
| 151 | return err; |
| 152 | |
| 153 | req = ceph_mdsc_create_request(mdsc, CEPH_MDS_OP_SETDIRLAYOUT, |
| 154 | USE_AUTH_MDS); |
| 155 | |
| 156 | if (IS_ERR(req)) |
| 157 | return PTR_ERR(req); |
| 158 | req->r_inode = inode; |
| 159 | ihold(inode); |
| 160 | req->r_num_caps = 1; |
| 161 | |
| 162 | req->r_args.setlayout.layout.fl_stripe_unit = |
| 163 | cpu_to_le32(l.stripe_unit); |
| 164 | req->r_args.setlayout.layout.fl_stripe_count = |
| 165 | cpu_to_le32(l.stripe_count); |
| 166 | req->r_args.setlayout.layout.fl_object_size = |
| 167 | cpu_to_le32(l.object_size); |
| 168 | req->r_args.setlayout.layout.fl_pg_pool = |
| 169 | cpu_to_le32(l.data_pool); |
| 170 | |
| 171 | err = ceph_mdsc_do_request(mdsc, inode, req); |
| 172 | ceph_mdsc_put_request(req); |
| 173 | return err; |
| 174 | } |
| 175 | |
| 176 | /* |
| 177 | * Return object name, size/offset information, and location (OSD |
| 178 | * number, network address) for a given file offset. |
| 179 | */ |
| 180 | static long ceph_ioctl_get_dataloc(struct file *file, void __user *arg) |
| 181 | { |
| 182 | struct ceph_ioctl_dataloc dl; |
| 183 | struct inode *inode = file_inode(file); |
| 184 | struct ceph_inode_info *ci = ceph_inode(inode); |
| 185 | struct ceph_osd_client *osdc = |
| 186 | &ceph_sb_to_fs_client(inode->i_sb)->client->osdc; |
| 187 | struct ceph_object_locator oloc; |
| 188 | CEPH_DEFINE_OID_ONSTACK(oid); |
| 189 | u32 xlen; |
| 190 | u64 tmp; |
| 191 | struct ceph_pg pgid; |
| 192 | int r; |
| 193 | |
| 194 | /* copy and validate */ |
| 195 | if (copy_from_user(&dl, arg, sizeof(dl))) |
| 196 | return -EFAULT; |
| 197 | |
| 198 | down_read(&osdc->lock); |
| 199 | ceph_calc_file_object_mapping(&ci->i_layout, dl.file_offset, 1, |
| 200 | &dl.object_no, &dl.object_offset, &xlen); |
| 201 | dl.file_offset -= dl.object_offset; |
| 202 | dl.object_size = ci->i_layout.object_size; |
| 203 | dl.block_size = ci->i_layout.stripe_unit; |
| 204 | |
| 205 | /* block_offset = object_offset % block_size */ |
| 206 | tmp = dl.object_offset; |
| 207 | dl.block_offset = do_div(tmp, dl.block_size); |
| 208 | |
| 209 | snprintf(dl.object_name, sizeof(dl.object_name), "%llx.%08llx", |
| 210 | ceph_ino(inode), dl.object_no); |
| 211 | |
| 212 | oloc.pool = ci->i_layout.pool_id; |
| 213 | oloc.pool_ns = ceph_try_get_string(ci->i_layout.pool_ns); |
| 214 | ceph_oid_printf(&oid, "%s", dl.object_name); |
| 215 | |
| 216 | r = ceph_object_locator_to_pg(osdc->osdmap, &oid, &oloc, &pgid); |
| 217 | |
| 218 | ceph_oloc_destroy(&oloc); |
| 219 | if (r < 0) { |
| 220 | up_read(&osdc->lock); |
| 221 | return r; |
| 222 | } |
| 223 | |
| 224 | dl.osd = ceph_pg_to_acting_primary(osdc->osdmap, &pgid); |
| 225 | if (dl.osd >= 0) { |
| 226 | struct ceph_entity_addr *a = |
| 227 | ceph_osd_addr(osdc->osdmap, dl.osd); |
| 228 | if (a) |
| 229 | memcpy(&dl.osd_addr, &a->in_addr, sizeof(dl.osd_addr)); |
| 230 | } else { |
| 231 | memset(&dl.osd_addr, 0, sizeof(dl.osd_addr)); |
| 232 | } |
| 233 | up_read(&osdc->lock); |
| 234 | |
| 235 | /* send result back to user */ |
| 236 | if (copy_to_user(arg, &dl, sizeof(dl))) |
| 237 | return -EFAULT; |
| 238 | |
| 239 | return 0; |
| 240 | } |
| 241 | |
| 242 | static long ceph_ioctl_lazyio(struct file *file) |
| 243 | { |
| 244 | struct ceph_file_info *fi = file->private_data; |
| 245 | struct inode *inode = file_inode(file); |
| 246 | struct ceph_inode_info *ci = ceph_inode(inode); |
| 247 | struct ceph_mds_client *mdsc = ceph_inode_to_fs_client(inode)->mdsc; |
| 248 | struct ceph_client *cl = mdsc->fsc->client; |
| 249 | |
| 250 | if ((fi->fmode & CEPH_FILE_MODE_LAZY) == 0) { |
| 251 | spin_lock(&ci->i_ceph_lock); |
| 252 | fi->fmode |= CEPH_FILE_MODE_LAZY; |
| 253 | ci->i_nr_by_mode[ffs(CEPH_FILE_MODE_LAZY)]++; |
| 254 | __ceph_touch_fmode(ci, mdsc, fi->fmode); |
| 255 | spin_unlock(&ci->i_ceph_lock); |
| 256 | doutc(cl, "file %p %p %llx.%llx marked lazy\n", file, inode, |
| 257 | ceph_vinop(inode)); |
| 258 | |
| 259 | ceph_check_caps(ci, 0); |
| 260 | } else { |
| 261 | doutc(cl, "file %p %p %llx.%llx already lazy\n", file, inode, |
| 262 | ceph_vinop(inode)); |
| 263 | } |
| 264 | return 0; |
| 265 | } |
| 266 | |
| 267 | static long ceph_ioctl_syncio(struct file *file) |
| 268 | { |
| 269 | struct ceph_file_info *fi = file->private_data; |
| 270 | |
| 271 | fi->flags |= CEPH_F_SYNC; |
| 272 | return 0; |
| 273 | } |
| 274 | |
| 275 | static int vet_mds_for_fscrypt(struct file *file) |
| 276 | { |
| 277 | int i, ret = -EOPNOTSUPP; |
| 278 | struct ceph_mds_client *mdsc = ceph_sb_to_mdsc(file_inode(file)->i_sb); |
| 279 | |
| 280 | mutex_lock(&mdsc->mutex); |
| 281 | for (i = 0; i < mdsc->max_sessions; i++) { |
| 282 | struct ceph_mds_session *s = mdsc->sessions[i]; |
| 283 | |
| 284 | if (!s) |
| 285 | continue; |
| 286 | if (test_bit(CEPHFS_FEATURE_ALTERNATE_NAME, &s->s_features)) |
| 287 | ret = 0; |
| 288 | break; |
| 289 | } |
| 290 | mutex_unlock(&mdsc->mutex); |
| 291 | return ret; |
| 292 | } |
| 293 | |
| 294 | static long ceph_set_encryption_policy(struct file *file, unsigned long arg) |
| 295 | { |
| 296 | int ret, got = 0; |
| 297 | struct inode *inode = file_inode(file); |
| 298 | struct ceph_inode_info *ci = ceph_inode(inode); |
| 299 | |
| 300 | /* encrypted directories can't have striped layout */ |
| 301 | if (ci->i_layout.stripe_count > 1) |
| 302 | return -EINVAL; |
| 303 | |
| 304 | ret = vet_mds_for_fscrypt(file); |
| 305 | if (ret) |
| 306 | return ret; |
| 307 | |
| 308 | /* |
| 309 | * Ensure we hold these caps so that we _know_ that the rstats check |
| 310 | * in the empty_dir check is reliable. |
| 311 | */ |
| 312 | ret = ceph_get_caps(file, CEPH_CAP_FILE_SHARED, 0, -1, &got); |
| 313 | if (ret) |
| 314 | return ret; |
| 315 | |
| 316 | ret = fscrypt_ioctl_set_policy(file, (const void __user *)arg); |
| 317 | if (got) |
| 318 | ceph_put_cap_refs(ci, got); |
| 319 | |
| 320 | return ret; |
| 321 | } |
| 322 | |
| 323 | static const char *ceph_ioctl_cmd_name(const unsigned int cmd) |
| 324 | { |
| 325 | switch (cmd) { |
| 326 | case CEPH_IOC_GET_LAYOUT: |
| 327 | return "get_layout"; |
| 328 | case CEPH_IOC_SET_LAYOUT: |
| 329 | return "set_layout"; |
| 330 | case CEPH_IOC_SET_LAYOUT_POLICY: |
| 331 | return "set_layout_policy"; |
| 332 | case CEPH_IOC_GET_DATALOC: |
| 333 | return "get_dataloc"; |
| 334 | case CEPH_IOC_LAZYIO: |
| 335 | return "lazyio"; |
| 336 | case CEPH_IOC_SYNCIO: |
| 337 | return "syncio"; |
| 338 | case FS_IOC_SET_ENCRYPTION_POLICY: |
| 339 | return "set_encryption_policy"; |
| 340 | case FS_IOC_GET_ENCRYPTION_POLICY: |
| 341 | return "get_encryption_policy"; |
| 342 | case FS_IOC_GET_ENCRYPTION_POLICY_EX: |
| 343 | return "get_encryption_policy_ex"; |
| 344 | case FS_IOC_ADD_ENCRYPTION_KEY: |
| 345 | return "add_encryption_key"; |
| 346 | case FS_IOC_REMOVE_ENCRYPTION_KEY: |
| 347 | return "remove_encryption_key"; |
| 348 | case FS_IOC_REMOVE_ENCRYPTION_KEY_ALL_USERS: |
| 349 | return "remove_encryption_key_all_users"; |
| 350 | case FS_IOC_GET_ENCRYPTION_KEY_STATUS: |
| 351 | return "get_encryption_key_status"; |
| 352 | case FS_IOC_GET_ENCRYPTION_NONCE: |
| 353 | return "get_encryption_nonce"; |
| 354 | default: |
| 355 | return "unknown"; |
| 356 | } |
| 357 | } |
| 358 | |
| 359 | long ceph_ioctl(struct file *file, unsigned int cmd, unsigned long arg) |
| 360 | { |
| 361 | struct inode *inode = file_inode(file); |
| 362 | struct ceph_fs_client *fsc = ceph_inode_to_fs_client(inode); |
| 363 | int ret; |
| 364 | |
| 365 | doutc(fsc->client, "file %p %p %llx.%llx cmd %s arg %lu\n", file, |
| 366 | inode, ceph_vinop(inode), ceph_ioctl_cmd_name(cmd), arg); |
| 367 | switch (cmd) { |
| 368 | case CEPH_IOC_GET_LAYOUT: |
| 369 | return ceph_ioctl_get_layout(file, (void __user *)arg); |
| 370 | |
| 371 | case CEPH_IOC_SET_LAYOUT: |
| 372 | return ceph_ioctl_set_layout(file, (void __user *)arg); |
| 373 | |
| 374 | case CEPH_IOC_SET_LAYOUT_POLICY: |
| 375 | return ceph_ioctl_set_layout_policy(file, (void __user *)arg); |
| 376 | |
| 377 | case CEPH_IOC_GET_DATALOC: |
| 378 | return ceph_ioctl_get_dataloc(file, (void __user *)arg); |
| 379 | |
| 380 | case CEPH_IOC_LAZYIO: |
| 381 | return ceph_ioctl_lazyio(file); |
| 382 | |
| 383 | case CEPH_IOC_SYNCIO: |
| 384 | return ceph_ioctl_syncio(file); |
| 385 | |
| 386 | case FS_IOC_SET_ENCRYPTION_POLICY: |
| 387 | return ceph_set_encryption_policy(file, arg); |
| 388 | |
| 389 | case FS_IOC_GET_ENCRYPTION_POLICY: |
| 390 | ret = vet_mds_for_fscrypt(file); |
| 391 | if (ret) |
| 392 | return ret; |
| 393 | return fscrypt_ioctl_get_policy(file, (void __user *)arg); |
| 394 | |
| 395 | case FS_IOC_GET_ENCRYPTION_POLICY_EX: |
| 396 | ret = vet_mds_for_fscrypt(file); |
| 397 | if (ret) |
| 398 | return ret; |
| 399 | return fscrypt_ioctl_get_policy_ex(file, (void __user *)arg); |
| 400 | |
| 401 | case FS_IOC_ADD_ENCRYPTION_KEY: |
| 402 | ret = vet_mds_for_fscrypt(file); |
| 403 | if (ret) |
| 404 | return ret; |
| 405 | return fscrypt_ioctl_add_key(file, (void __user *)arg); |
| 406 | |
| 407 | case FS_IOC_REMOVE_ENCRYPTION_KEY: |
| 408 | return fscrypt_ioctl_remove_key(file, (void __user *)arg); |
| 409 | |
| 410 | case FS_IOC_REMOVE_ENCRYPTION_KEY_ALL_USERS: |
| 411 | return fscrypt_ioctl_remove_key_all_users(file, |
| 412 | (void __user *)arg); |
| 413 | |
| 414 | case FS_IOC_GET_ENCRYPTION_KEY_STATUS: |
| 415 | return fscrypt_ioctl_get_key_status(file, (void __user *)arg); |
| 416 | |
| 417 | case FS_IOC_GET_ENCRYPTION_NONCE: |
| 418 | ret = vet_mds_for_fscrypt(file); |
| 419 | if (ret) |
| 420 | return ret; |
| 421 | return fscrypt_ioctl_get_nonce(file, (void __user *)arg); |
| 422 | } |
| 423 | |
| 424 | return -ENOTTY; |
| 425 | } |