bsg: cdev lock_kernel() pushdown
[linux-block.git] / block / bsg.c
CommitLineData
3d6392cf 1/*
0c6a89ba 2 * bsg.c - block layer implementation of the sg v4 interface
3d6392cf
JA
3 *
4 * Copyright (C) 2004 Jens Axboe <axboe@suse.de> SUSE Labs
5 * Copyright (C) 2004 Peter M. Jones <pjones@redhat.com>
6 *
7 * This file is subject to the terms and conditions of the GNU General Public
8 * License version 2. See the file "COPYING" in the main directory of this
9 * archive for more details.
10 *
11 */
3d6392cf
JA
12#include <linux/module.h>
13#include <linux/init.h>
14#include <linux/file.h>
15#include <linux/blkdev.h>
16#include <linux/poll.h>
17#include <linux/cdev.h>
18#include <linux/percpu.h>
19#include <linux/uio.h>
598443a2 20#include <linux/idr.h>
3d6392cf 21#include <linux/bsg.h>
75bd2ef1 22#include <linux/smp_lock.h>
3d6392cf
JA
23
24#include <scsi/scsi.h>
25#include <scsi/scsi_ioctl.h>
26#include <scsi/scsi_cmnd.h>
4e2872d6
FT
27#include <scsi/scsi_device.h>
28#include <scsi/scsi_driver.h>
3d6392cf
JA
29#include <scsi/sg.h>
30
0ed081ce
FT
31#define BSG_DESCRIPTION "Block layer SCSI generic (bsg) driver"
32#define BSG_VERSION "0.4"
3d6392cf 33
3d6392cf 34struct bsg_device {
165125e1 35 struct request_queue *queue;
3d6392cf
JA
36 spinlock_t lock;
37 struct list_head busy_list;
38 struct list_head done_list;
39 struct hlist_node dev_list;
40 atomic_t ref_count;
3d6392cf
JA
41 int queued_cmds;
42 int done_cmds;
3d6392cf
JA
43 wait_queue_head_t wq_done;
44 wait_queue_head_t wq_free;
d351af01 45 char name[BUS_ID_SIZE];
3d6392cf
JA
46 int max_queue;
47 unsigned long flags;
48};
49
/*
 * Bit numbers (not masks) used with set_bit()/clear_bit()/test_bit() on
 * bsg_device->flags.
 */
enum {
	BSG_F_BLOCK		= 1,	/* cleared when the file is O_NONBLOCK */
	BSG_F_WRITE_PERM	= 2,	/* set when the file has FMODE_WRITE */
};
54
5309cb38 55#define BSG_DEFAULT_CMDS 64
292b7f27 56#define BSG_MAX_DEVS 32768
3d6392cf
JA
57
58#undef BSG_DEBUG
59
60#ifdef BSG_DEBUG
24c03d47 61#define dprintk(fmt, args...) printk(KERN_ERR "%s: " fmt, __func__, ##args)
3d6392cf
JA
62#else
63#define dprintk(fmt, args...)
64#endif
65
3d6392cf 66static DEFINE_MUTEX(bsg_mutex);
598443a2 67static DEFINE_IDR(bsg_minor_idr);
3d6392cf 68
25fd1643 69#define BSG_LIST_ARRAY_SIZE 8
25fd1643 70static struct hlist_head bsg_device_list[BSG_LIST_ARRAY_SIZE];
3d6392cf
JA
71
72static struct class *bsg_class;
46f6ef4a 73static int bsg_major;
3d6392cf 74
5309cb38
JA
75static struct kmem_cache *bsg_cmd_cachep;
76
3d6392cf
JA
77/*
78 * our internal command type
79 */
80struct bsg_command {
81 struct bsg_device *bd;
82 struct list_head list;
83 struct request *rq;
84 struct bio *bio;
2c9ecdf4 85 struct bio *bidi_bio;
3d6392cf 86 int err;
70e36ece 87 struct sg_io_v4 hdr;
3d6392cf
JA
88 char sense[SCSI_SENSE_BUFFERSIZE];
89};
90
91static void bsg_free_command(struct bsg_command *bc)
92{
93 struct bsg_device *bd = bc->bd;
3d6392cf
JA
94 unsigned long flags;
95
5309cb38 96 kmem_cache_free(bsg_cmd_cachep, bc);
3d6392cf
JA
97
98 spin_lock_irqsave(&bd->lock, flags);
99 bd->queued_cmds--;
3d6392cf
JA
100 spin_unlock_irqrestore(&bd->lock, flags);
101
102 wake_up(&bd->wq_free);
103}
104
e7d72173 105static struct bsg_command *bsg_alloc_command(struct bsg_device *bd)
3d6392cf 106{
e7d72173 107 struct bsg_command *bc = ERR_PTR(-EINVAL);
3d6392cf
JA
108
109 spin_lock_irq(&bd->lock);
110
111 if (bd->queued_cmds >= bd->max_queue)
112 goto out;
113
3d6392cf 114 bd->queued_cmds++;
3d6392cf
JA
115 spin_unlock_irq(&bd->lock);
116
25fd1643 117 bc = kmem_cache_zalloc(bsg_cmd_cachep, GFP_KERNEL);
5309cb38
JA
118 if (unlikely(!bc)) {
119 spin_lock_irq(&bd->lock);
7e75d730 120 bd->queued_cmds--;
e7d72173 121 bc = ERR_PTR(-ENOMEM);
7e75d730 122 goto out;
5309cb38
JA
123 }
124
3d6392cf
JA
125 bc->bd = bd;
126 INIT_LIST_HEAD(&bc->list);
5309cb38 127 dprintk("%s: returning free cmd %p\n", bd->name, bc);
3d6392cf
JA
128 return bc;
129out:
3d6392cf
JA
130 spin_unlock_irq(&bd->lock);
131 return bc;
132}
133
1c1133e1 134static inline struct hlist_head *bsg_dev_idx_hash(int index)
3d6392cf 135{
1c1133e1 136 return &bsg_device_list[index & (BSG_LIST_ARRAY_SIZE - 1)];
3d6392cf
JA
137}
138
25fd1643 139static int bsg_io_schedule(struct bsg_device *bd)
3d6392cf
JA
140{
141 DEFINE_WAIT(wait);
142 int ret = 0;
143
144 spin_lock_irq(&bd->lock);
145
146 BUG_ON(bd->done_cmds > bd->queued_cmds);
147
148 /*
149 * -ENOSPC or -ENODATA? I'm going for -ENODATA, meaning "I have no
150 * work to do", even though we return -ENOSPC after this same test
151 * during bsg_write() -- there, it means our buffer can't have more
152 * bsg_commands added to it, thus has no space left.
153 */
154 if (bd->done_cmds == bd->queued_cmds) {
155 ret = -ENODATA;
156 goto unlock;
157 }
158
159 if (!test_bit(BSG_F_BLOCK, &bd->flags)) {
160 ret = -EAGAIN;
161 goto unlock;
162 }
163
25fd1643 164 prepare_to_wait(&bd->wq_done, &wait, TASK_UNINTERRUPTIBLE);
3d6392cf
JA
165 spin_unlock_irq(&bd->lock);
166 io_schedule();
167 finish_wait(&bd->wq_done, &wait);
168
3d6392cf
JA
169 return ret;
170unlock:
171 spin_unlock_irq(&bd->lock);
172 return ret;
173}
174
165125e1 175static int blk_fill_sgv4_hdr_rq(struct request_queue *q, struct request *rq,
70e36ece
FT
176 struct sg_io_v4 *hdr, int has_write_perm)
177{
9f5de6b1
FT
178 if (hdr->request_len > BLK_MAX_CDB) {
179 rq->cmd = kzalloc(hdr->request_len, GFP_KERNEL);
180 if (!rq->cmd)
181 return -ENOMEM;
182 }
70e36ece
FT
183
184 if (copy_from_user(rq->cmd, (void *)(unsigned long)hdr->request,
185 hdr->request_len))
186 return -EFAULT;
15d10b61
FT
187
188 if (hdr->subprotocol == BSG_SUB_PROTOCOL_SCSI_CMD) {
189 if (blk_verify_command(rq->cmd, has_write_perm))
190 return -EPERM;
191 } else if (!capable(CAP_SYS_RAWIO))
70e36ece
FT
192 return -EPERM;
193
194 /*
195 * fill in request structure
196 */
197 rq->cmd_len = hdr->request_len;
198 rq->cmd_type = REQ_TYPE_BLOCK_PC;
199
200 rq->timeout = (hdr->timeout * HZ) / 1000;
201 if (!rq->timeout)
202 rq->timeout = q->sg_timeout;
203 if (!rq->timeout)
204 rq->timeout = BLK_DEFAULT_SG_TIMEOUT;
205
206 return 0;
207}
208
3d6392cf 209/*
70e36ece 210 * Check if sg_io_v4 from user is allowed and valid
3d6392cf
JA
211 */
212static int
165125e1 213bsg_validate_sgv4_hdr(struct request_queue *q, struct sg_io_v4 *hdr, int *rw)
3d6392cf 214{
15d10b61
FT
215 int ret = 0;
216
70e36ece 217 if (hdr->guard != 'Q')
3d6392cf 218 return -EINVAL;
70e36ece
FT
219 if (hdr->dout_xfer_len > (q->max_sectors << 9) ||
220 hdr->din_xfer_len > (q->max_sectors << 9))
3d6392cf
JA
221 return -EIO;
222
15d10b61
FT
223 switch (hdr->protocol) {
224 case BSG_PROTOCOL_SCSI:
225 switch (hdr->subprotocol) {
226 case BSG_SUB_PROTOCOL_SCSI_CMD:
227 case BSG_SUB_PROTOCOL_SCSI_TRANSPORT:
228 break;
229 default:
230 ret = -EINVAL;
231 }
232 break;
233 default:
234 ret = -EINVAL;
235 }
70e36ece 236
70e36ece 237 *rw = hdr->dout_xfer_len ? WRITE : READ;
15d10b61 238 return ret;
3d6392cf
JA
239}
240
241/*
70e36ece 242 * map sg_io_v4 to a request.
3d6392cf
JA
243 */
244static struct request *
70e36ece 245bsg_map_hdr(struct bsg_device *bd, struct sg_io_v4 *hdr)
3d6392cf 246{
165125e1 247 struct request_queue *q = bd->queue;
2c9ecdf4 248 struct request *rq, *next_rq = NULL;
25fd1643 249 int ret, rw;
70e36ece
FT
250 unsigned int dxfer_len;
251 void *dxferp = NULL;
3d6392cf 252
70e36ece
FT
253 dprintk("map hdr %llx/%u %llx/%u\n", (unsigned long long) hdr->dout_xferp,
254 hdr->dout_xfer_len, (unsigned long long) hdr->din_xferp,
255 hdr->din_xfer_len);
3d6392cf 256
70e36ece 257 ret = bsg_validate_sgv4_hdr(q, hdr, &rw);
3d6392cf
JA
258 if (ret)
259 return ERR_PTR(ret);
260
261 /*
262 * map scatter-gather elements seperately and string them to request
263 */
264 rq = blk_get_request(q, rw, GFP_KERNEL);
2c9ecdf4
FT
265 if (!rq)
266 return ERR_PTR(-ENOMEM);
70e36ece
FT
267 ret = blk_fill_sgv4_hdr_rq(q, rq, hdr, test_bit(BSG_F_WRITE_PERM,
268 &bd->flags));
2c9ecdf4
FT
269 if (ret)
270 goto out;
271
272 if (rw == WRITE && hdr->din_xfer_len) {
273 if (!test_bit(QUEUE_FLAG_BIDI, &q->queue_flags)) {
274 ret = -EOPNOTSUPP;
275 goto out;
276 }
277
278 next_rq = blk_get_request(q, READ, GFP_KERNEL);
279 if (!next_rq) {
280 ret = -ENOMEM;
281 goto out;
282 }
283 rq->next_rq = next_rq;
40f62028 284 next_rq->cmd_type = rq->cmd_type;
2c9ecdf4
FT
285
286 dxferp = (void*)(unsigned long)hdr->din_xferp;
287 ret = blk_rq_map_user(q, next_rq, dxferp, hdr->din_xfer_len);
288 if (ret)
289 goto out;
3d6392cf
JA
290 }
291
70e36ece
FT
292 if (hdr->dout_xfer_len) {
293 dxfer_len = hdr->dout_xfer_len;
294 dxferp = (void*)(unsigned long)hdr->dout_xferp;
295 } else if (hdr->din_xfer_len) {
296 dxfer_len = hdr->din_xfer_len;
297 dxferp = (void*)(unsigned long)hdr->din_xferp;
298 } else
299 dxfer_len = 0;
300
301 if (dxfer_len) {
302 ret = blk_rq_map_user(q, rq, dxferp, dxfer_len);
2c9ecdf4
FT
303 if (ret)
304 goto out;
3d6392cf 305 }
3d6392cf 306 return rq;
2c9ecdf4 307out:
9f5de6b1
FT
308 if (rq->cmd != rq->__cmd)
309 kfree(rq->cmd);
2c9ecdf4
FT
310 blk_put_request(rq);
311 if (next_rq) {
312 blk_rq_unmap_user(next_rq->bio);
313 blk_put_request(next_rq);
314 }
315 return ERR_PTR(ret);
3d6392cf
JA
316}
317
318/*
319 * async completion call-back from the block layer, when scsi/ide/whatever
320 * calls end_that_request_last() on a request
321 */
322static void bsg_rq_end_io(struct request *rq, int uptodate)
323{
324 struct bsg_command *bc = rq->end_io_data;
325 struct bsg_device *bd = bc->bd;
326 unsigned long flags;
327
5309cb38
JA
328 dprintk("%s: finished rq %p bc %p, bio %p stat %d\n",
329 bd->name, rq, bc, bc->bio, uptodate);
3d6392cf
JA
330
331 bc->hdr.duration = jiffies_to_msecs(jiffies - bc->hdr.duration);
332
333 spin_lock_irqsave(&bd->lock, flags);
25fd1643
JA
334 list_move_tail(&bc->list, &bd->done_list);
335 bd->done_cmds++;
3d6392cf 336 spin_unlock_irqrestore(&bd->lock, flags);
25fd1643
JA
337
338 wake_up(&bd->wq_done);
3d6392cf
JA
339}
340
341/*
342 * do final setup of a 'bc' and submit the matching 'rq' to the block
343 * layer for io
344 */
165125e1 345static void bsg_add_command(struct bsg_device *bd, struct request_queue *q,
3d6392cf
JA
346 struct bsg_command *bc, struct request *rq)
347{
348 rq->sense = bc->sense;
349 rq->sense_len = 0;
350
351 /*
352 * add bc command to busy queue and submit rq for io
353 */
354 bc->rq = rq;
355 bc->bio = rq->bio;
2c9ecdf4
FT
356 if (rq->next_rq)
357 bc->bidi_bio = rq->next_rq->bio;
3d6392cf
JA
358 bc->hdr.duration = jiffies;
359 spin_lock_irq(&bd->lock);
360 list_add_tail(&bc->list, &bd->busy_list);
361 spin_unlock_irq(&bd->lock);
362
363 dprintk("%s: queueing rq %p, bc %p\n", bd->name, rq, bc);
364
365 rq->end_io_data = bc;
d351af01 366 blk_execute_rq_nowait(q, NULL, rq, 1, bsg_rq_end_io);
3d6392cf
JA
367}
368
25fd1643 369static struct bsg_command *bsg_next_done_cmd(struct bsg_device *bd)
3d6392cf
JA
370{
371 struct bsg_command *bc = NULL;
372
373 spin_lock_irq(&bd->lock);
374 if (bd->done_cmds) {
43ac9e62 375 bc = list_first_entry(&bd->done_list, struct bsg_command, list);
25fd1643
JA
376 list_del(&bc->list);
377 bd->done_cmds--;
3d6392cf
JA
378 }
379 spin_unlock_irq(&bd->lock);
380
381 return bc;
382}
383
384/*
385 * Get a finished command from the done list
386 */
e7d72173 387static struct bsg_command *bsg_get_done_cmd(struct bsg_device *bd)
3d6392cf
JA
388{
389 struct bsg_command *bc;
390 int ret;
391
392 do {
393 bc = bsg_next_done_cmd(bd);
394 if (bc)
395 break;
396
e7d72173
FT
397 if (!test_bit(BSG_F_BLOCK, &bd->flags)) {
398 bc = ERR_PTR(-EAGAIN);
399 break;
400 }
401
402 ret = wait_event_interruptible(bd->wq_done, bd->done_cmds);
3d6392cf 403 if (ret) {
e7d72173 404 bc = ERR_PTR(-ERESTARTSYS);
3d6392cf
JA
405 break;
406 }
407 } while (1);
408
409 dprintk("%s: returning done %p\n", bd->name, bc);
410
411 return bc;
412}
413
70e36ece 414static int blk_complete_sgv4_hdr_rq(struct request *rq, struct sg_io_v4 *hdr,
2c9ecdf4 415 struct bio *bio, struct bio *bidi_bio)
70e36ece
FT
416{
417 int ret = 0;
418
419 dprintk("rq %p bio %p %u\n", rq, bio, rq->errors);
420 /*
421 * fill in all the output members
422 */
423 hdr->device_status = status_byte(rq->errors);
424 hdr->transport_status = host_byte(rq->errors);
425 hdr->driver_status = driver_byte(rq->errors);
426 hdr->info = 0;
427 if (hdr->device_status || hdr->transport_status || hdr->driver_status)
428 hdr->info |= SG_INFO_CHECK;
70e36ece
FT
429 hdr->response_len = 0;
430
431 if (rq->sense_len && hdr->response) {
25fd1643
JA
432 int len = min_t(unsigned int, hdr->max_response_len,
433 rq->sense_len);
70e36ece
FT
434
435 ret = copy_to_user((void*)(unsigned long)hdr->response,
436 rq->sense, len);
437 if (!ret)
438 hdr->response_len = len;
439 else
440 ret = -EFAULT;
441 }
442
2c9ecdf4 443 if (rq->next_rq) {
7a85f889
FT
444 hdr->dout_resid = rq->data_len;
445 hdr->din_resid = rq->next_rq->data_len;
2c9ecdf4
FT
446 blk_rq_unmap_user(bidi_bio);
447 blk_put_request(rq->next_rq);
0c6a89ba 448 } else if (rq_data_dir(rq) == READ)
7a85f889 449 hdr->din_resid = rq->data_len;
0c6a89ba 450 else
7a85f889 451 hdr->dout_resid = rq->data_len;
2c9ecdf4 452
2d507a01
JB
453 /*
454 * If the request generated a negative error number, return it
455 * (providing we aren't already returning an error); if it's
456 * just a protocol response (i.e. non negative), that gets
457 * processed above.
458 */
459 if (!ret && rq->errors < 0)
460 ret = rq->errors;
461
70e36ece 462 blk_rq_unmap_user(bio);
9f5de6b1
FT
463 if (rq->cmd != rq->__cmd)
464 kfree(rq->cmd);
70e36ece
FT
465 blk_put_request(rq);
466
467 return ret;
468}
469
3d6392cf
JA
470static int bsg_complete_all_commands(struct bsg_device *bd)
471{
472 struct bsg_command *bc;
473 int ret, tret;
474
475 dprintk("%s: entered\n", bd->name);
476
3d6392cf
JA
477 /*
478 * wait for all commands to complete
479 */
480 ret = 0;
481 do {
25fd1643 482 ret = bsg_io_schedule(bd);
3d6392cf
JA
483 /*
484 * look for -ENODATA specifically -- we'll sometimes get
485 * -ERESTARTSYS when we've taken a signal, but we can't
486 * return until we're done freeing the queue, so ignore
487 * it. The signal will get handled when we're done freeing
488 * the bsg_device.
489 */
490 } while (ret != -ENODATA);
491
492 /*
493 * discard done commands
494 */
495 ret = 0;
496 do {
e7d72173
FT
497 spin_lock_irq(&bd->lock);
498 if (!bd->queued_cmds) {
499 spin_unlock_irq(&bd->lock);
3d6392cf
JA
500 break;
501 }
efba1a31 502 spin_unlock_irq(&bd->lock);
3d6392cf 503
e7d72173
FT
504 bc = bsg_get_done_cmd(bd);
505 if (IS_ERR(bc))
506 break;
507
2c9ecdf4
FT
508 tret = blk_complete_sgv4_hdr_rq(bc->rq, &bc->hdr, bc->bio,
509 bc->bidi_bio);
3d6392cf
JA
510 if (!ret)
511 ret = tret;
512
513 bsg_free_command(bc);
514 } while (1);
515
516 return ret;
517}
518
25fd1643 519static int
e7d72173
FT
520__bsg_read(char __user *buf, size_t count, struct bsg_device *bd,
521 const struct iovec *iov, ssize_t *bytes_read)
3d6392cf
JA
522{
523 struct bsg_command *bc;
524 int nr_commands, ret;
525
70e36ece 526 if (count % sizeof(struct sg_io_v4))
3d6392cf
JA
527 return -EINVAL;
528
529 ret = 0;
70e36ece 530 nr_commands = count / sizeof(struct sg_io_v4);
3d6392cf 531 while (nr_commands) {
e7d72173 532 bc = bsg_get_done_cmd(bd);
3d6392cf
JA
533 if (IS_ERR(bc)) {
534 ret = PTR_ERR(bc);
535 break;
536 }
537
538 /*
539 * this is the only case where we need to copy data back
540 * after completing the request. so do that here,
541 * bsg_complete_work() cannot do that for us
542 */
2c9ecdf4
FT
543 ret = blk_complete_sgv4_hdr_rq(bc->rq, &bc->hdr, bc->bio,
544 bc->bidi_bio);
3d6392cf 545
25fd1643 546 if (copy_to_user(buf, &bc->hdr, sizeof(bc->hdr)))
3d6392cf
JA
547 ret = -EFAULT;
548
549 bsg_free_command(bc);
550
551 if (ret)
552 break;
553
70e36ece
FT
554 buf += sizeof(struct sg_io_v4);
555 *bytes_read += sizeof(struct sg_io_v4);
3d6392cf
JA
556 nr_commands--;
557 }
558
559 return ret;
560}
561
562static inline void bsg_set_block(struct bsg_device *bd, struct file *file)
563{
564 if (file->f_flags & O_NONBLOCK)
565 clear_bit(BSG_F_BLOCK, &bd->flags);
566 else
567 set_bit(BSG_F_BLOCK, &bd->flags);
568}
569
570static inline void bsg_set_write_perm(struct bsg_device *bd, struct file *file)
571{
572 if (file->f_mode & FMODE_WRITE)
573 set_bit(BSG_F_WRITE_PERM, &bd->flags);
574 else
575 clear_bit(BSG_F_WRITE_PERM, &bd->flags);
576}
577
25fd1643
JA
/*
 * Check if the error is a "real" error that we should return.
 *
 * Success (0) and the "soft" conditions -ENOSPC, -ENODATA and -EAGAIN
 * yield 0, every other value yields 1.
 */
static inline int err_block_err(int ret)
{
	switch (ret) {
	case 0:
	case -ENOSPC:
	case -ENODATA:
	case -EAGAIN:
		return 0;
	default:
		return 1;
	}
}
588
589static ssize_t
590bsg_read(struct file *file, char __user *buf, size_t count, loff_t *ppos)
591{
592 struct bsg_device *bd = file->private_data;
593 int ret;
594 ssize_t bytes_read;
595
9e69fbb5 596 dprintk("%s: read %Zd bytes\n", bd->name, count);
3d6392cf
JA
597
598 bsg_set_block(bd, file);
599 bytes_read = 0;
e7d72173 600 ret = __bsg_read(buf, count, bd, NULL, &bytes_read);
3d6392cf
JA
601 *ppos = bytes_read;
602
603 if (!bytes_read || (bytes_read && err_block_err(ret)))
604 bytes_read = ret;
605
606 return bytes_read;
607}
608
25fd1643
JA
609static int __bsg_write(struct bsg_device *bd, const char __user *buf,
610 size_t count, ssize_t *bytes_written)
3d6392cf
JA
611{
612 struct bsg_command *bc;
613 struct request *rq;
614 int ret, nr_commands;
615
70e36ece 616 if (count % sizeof(struct sg_io_v4))
3d6392cf
JA
617 return -EINVAL;
618
70e36ece 619 nr_commands = count / sizeof(struct sg_io_v4);
3d6392cf
JA
620 rq = NULL;
621 bc = NULL;
622 ret = 0;
623 while (nr_commands) {
165125e1 624 struct request_queue *q = bd->queue;
3d6392cf 625
e7d72173 626 bc = bsg_alloc_command(bd);
3d6392cf
JA
627 if (IS_ERR(bc)) {
628 ret = PTR_ERR(bc);
629 bc = NULL;
630 break;
631 }
632
3d6392cf
JA
633 if (copy_from_user(&bc->hdr, buf, sizeof(bc->hdr))) {
634 ret = -EFAULT;
635 break;
636 }
637
638 /*
639 * get a request, fill in the blanks, and add to request queue
640 */
70e36ece 641 rq = bsg_map_hdr(bd, &bc->hdr);
3d6392cf
JA
642 if (IS_ERR(rq)) {
643 ret = PTR_ERR(rq);
644 rq = NULL;
645 break;
646 }
647
648 bsg_add_command(bd, q, bc, rq);
649 bc = NULL;
650 rq = NULL;
651 nr_commands--;
70e36ece 652 buf += sizeof(struct sg_io_v4);
25fd1643 653 *bytes_written += sizeof(struct sg_io_v4);
3d6392cf
JA
654 }
655
3d6392cf
JA
656 if (bc)
657 bsg_free_command(bc);
658
659 return ret;
660}
661
662static ssize_t
663bsg_write(struct file *file, const char __user *buf, size_t count, loff_t *ppos)
664{
665 struct bsg_device *bd = file->private_data;
25fd1643 666 ssize_t bytes_written;
3d6392cf
JA
667 int ret;
668
9e69fbb5 669 dprintk("%s: write %Zd bytes\n", bd->name, count);
3d6392cf
JA
670
671 bsg_set_block(bd, file);
672 bsg_set_write_perm(bd, file);
673
25fd1643
JA
674 bytes_written = 0;
675 ret = __bsg_write(bd, buf, count, &bytes_written);
676 *ppos = bytes_written;
3d6392cf
JA
677
678 /*
679 * return bytes written on non-fatal errors
680 */
25fd1643
JA
681 if (!bytes_written || (bytes_written && err_block_err(ret)))
682 bytes_written = ret;
3d6392cf 683
25fd1643
JA
684 dprintk("%s: returning %Zd\n", bd->name, bytes_written);
685 return bytes_written;
3d6392cf
JA
686}
687
3d6392cf
JA
688static struct bsg_device *bsg_alloc_device(void)
689{
3d6392cf 690 struct bsg_device *bd;
3d6392cf
JA
691
692 bd = kzalloc(sizeof(struct bsg_device), GFP_KERNEL);
693 if (unlikely(!bd))
694 return NULL;
695
696 spin_lock_init(&bd->lock);
697
5309cb38 698 bd->max_queue = BSG_DEFAULT_CMDS;
3d6392cf
JA
699
700 INIT_LIST_HEAD(&bd->busy_list);
701 INIT_LIST_HEAD(&bd->done_list);
702 INIT_HLIST_NODE(&bd->dev_list);
703
704 init_waitqueue_head(&bd->wq_free);
705 init_waitqueue_head(&bd->wq_done);
706 return bd;
3d6392cf
JA
707}
708
97f46ae4
FT
709static void bsg_kref_release_function(struct kref *kref)
710{
711 struct bsg_class_device *bcd =
712 container_of(kref, struct bsg_class_device, ref);
713
714 if (bcd->release)
715 bcd->release(bcd->parent);
716
717 put_device(bcd->parent);
718}
719
3d6392cf
JA
720static int bsg_put_device(struct bsg_device *bd)
721{
97f46ae4
FT
722 int ret = 0, do_free;
723 struct request_queue *q = bd->queue;
3d6392cf
JA
724
725 mutex_lock(&bsg_mutex);
726
97f46ae4
FT
727 do_free = atomic_dec_and_test(&bd->ref_count);
728 if (!do_free)
3d6392cf
JA
729 goto out;
730
731 dprintk("%s: tearing down\n", bd->name);
732
733 /*
734 * close can always block
735 */
736 set_bit(BSG_F_BLOCK, &bd->flags);
737
738 /*
739 * correct error detection baddies here again. it's the responsibility
740 * of the app to properly reap commands before close() if it wants
741 * fool-proof error detection
742 */
743 ret = bsg_complete_all_commands(bd);
744
3d6392cf 745 hlist_del(&bd->dev_list);
5309cb38 746 kfree(bd);
3d6392cf
JA
747out:
748 mutex_unlock(&bsg_mutex);
97f46ae4
FT
749 kref_put(&q->bsg_dev.ref, bsg_kref_release_function);
750 if (do_free)
751 blk_put_queue(q);
3d6392cf
JA
752 return ret;
753}
754
755static struct bsg_device *bsg_add_device(struct inode *inode,
d351af01 756 struct request_queue *rq,
3d6392cf
JA
757 struct file *file)
758{
25fd1643 759 struct bsg_device *bd;
c3ff1b90 760 int ret;
3d6392cf
JA
761#ifdef BSG_DEBUG
762 unsigned char buf[32];
763#endif
c3ff1b90
FT
764 ret = blk_get_queue(rq);
765 if (ret)
766 return ERR_PTR(-ENXIO);
3d6392cf
JA
767
768 bd = bsg_alloc_device();
c3ff1b90
FT
769 if (!bd) {
770 blk_put_queue(rq);
3d6392cf 771 return ERR_PTR(-ENOMEM);
c3ff1b90 772 }
3d6392cf 773
d351af01 774 bd->queue = rq;
3d6392cf
JA
775 bsg_set_block(bd, file);
776
777 atomic_set(&bd->ref_count, 1);
3d6392cf 778 mutex_lock(&bsg_mutex);
842ea771 779 hlist_add_head(&bd->dev_list, bsg_dev_idx_hash(iminor(inode)));
3d6392cf 780
ee959b00 781 strncpy(bd->name, rq->bsg_dev.class_dev->bus_id, sizeof(bd->name) - 1);
3d6392cf 782 dprintk("bound to <%s>, max queue %d\n",
9e69fbb5 783 format_dev_t(buf, inode->i_rdev), bd->max_queue);
3d6392cf
JA
784
785 mutex_unlock(&bsg_mutex);
786 return bd;
787}
788
842ea771 789static struct bsg_device *__bsg_get_device(int minor, struct request_queue *q)
3d6392cf 790{
43ac9e62 791 struct bsg_device *bd;
3d6392cf
JA
792 struct hlist_node *entry;
793
794 mutex_lock(&bsg_mutex);
795
43ac9e62 796 hlist_for_each_entry(bd, entry, bsg_dev_idx_hash(minor), dev_list) {
842ea771 797 if (bd->queue == q) {
3d6392cf 798 atomic_inc(&bd->ref_count);
43ac9e62 799 goto found;
3d6392cf 800 }
3d6392cf 801 }
43ac9e62
FT
802 bd = NULL;
803found:
3d6392cf
JA
804 mutex_unlock(&bsg_mutex);
805 return bd;
806}
807
808static struct bsg_device *bsg_get_device(struct inode *inode, struct file *file)
809{
598443a2
FT
810 struct bsg_device *bd;
811 struct bsg_class_device *bcd;
3d6392cf 812
3d6392cf
JA
813 /*
814 * find the class device
815 */
3d6392cf 816 mutex_lock(&bsg_mutex);
598443a2 817 bcd = idr_find(&bsg_minor_idr, iminor(inode));
d45ac4fa 818 if (bcd)
97f46ae4 819 kref_get(&bcd->ref);
3d6392cf
JA
820 mutex_unlock(&bsg_mutex);
821
822 if (!bcd)
823 return ERR_PTR(-ENODEV);
824
842ea771 825 bd = __bsg_get_device(iminor(inode), bcd->queue);
d45ac4fa
FT
826 if (bd)
827 return bd;
828
829 bd = bsg_add_device(inode, bcd->queue, file);
830 if (IS_ERR(bd))
97f46ae4 831 kref_put(&bcd->ref, bsg_kref_release_function);
d45ac4fa
FT
832
833 return bd;
3d6392cf
JA
834}
835
836static int bsg_open(struct inode *inode, struct file *file)
837{
75bd2ef1
JC
838 struct bsg_device *bd;
839
840 lock_kernel();
841 bd = bsg_get_device(inode, file);
842 unlock_kernel();
3d6392cf
JA
843
844 if (IS_ERR(bd))
845 return PTR_ERR(bd);
846
847 file->private_data = bd;
848 return 0;
849}
850
851static int bsg_release(struct inode *inode, struct file *file)
852{
853 struct bsg_device *bd = file->private_data;
854
855 file->private_data = NULL;
856 return bsg_put_device(bd);
857}
858
859static unsigned int bsg_poll(struct file *file, poll_table *wait)
860{
861 struct bsg_device *bd = file->private_data;
862 unsigned int mask = 0;
863
864 poll_wait(file, &bd->wq_done, wait);
865 poll_wait(file, &bd->wq_free, wait);
866
867 spin_lock_irq(&bd->lock);
868 if (!list_empty(&bd->done_list))
869 mask |= POLLIN | POLLRDNORM;
870 if (bd->queued_cmds >= bd->max_queue)
871 mask |= POLLOUT;
872 spin_unlock_irq(&bd->lock);
873
874 return mask;
875}
876
25fd1643 877static long bsg_ioctl(struct file *file, unsigned int cmd, unsigned long arg)
3d6392cf
JA
878{
879 struct bsg_device *bd = file->private_data;
880 int __user *uarg = (int __user *) arg;
2d507a01 881 int ret;
3d6392cf 882
3d6392cf
JA
883 switch (cmd) {
884 /*
885 * our own ioctls
886 */
887 case SG_GET_COMMAND_Q:
888 return put_user(bd->max_queue, uarg);
5309cb38 889 case SG_SET_COMMAND_Q: {
3d6392cf
JA
890 int queue;
891
892 if (get_user(queue, uarg))
893 return -EFAULT;
5309cb38 894 if (queue < 1)
3d6392cf
JA
895 return -EINVAL;
896
5309cb38 897 spin_lock_irq(&bd->lock);
3d6392cf 898 bd->max_queue = queue;
5309cb38 899 spin_unlock_irq(&bd->lock);
3d6392cf
JA
900 return 0;
901 }
902
903 /*
904 * SCSI/sg ioctls
905 */
906 case SG_GET_VERSION_NUM:
907 case SCSI_IOCTL_GET_IDLUN:
908 case SCSI_IOCTL_GET_BUS_NUMBER:
909 case SG_SET_TIMEOUT:
910 case SG_GET_TIMEOUT:
911 case SG_GET_RESERVED_SIZE:
912 case SG_SET_RESERVED_SIZE:
913 case SG_EMULATED_HOST:
3d6392cf
JA
914 case SCSI_IOCTL_SEND_COMMAND: {
915 void __user *uarg = (void __user *) arg;
d351af01 916 return scsi_cmd_ioctl(file, bd->queue, NULL, cmd, uarg);
3d6392cf 917 }
10e8855b
FT
918 case SG_IO: {
919 struct request *rq;
2c9ecdf4 920 struct bio *bio, *bidi_bio = NULL;
10e8855b
FT
921 struct sg_io_v4 hdr;
922
923 if (copy_from_user(&hdr, uarg, sizeof(hdr)))
924 return -EFAULT;
925
926 rq = bsg_map_hdr(bd, &hdr);
927 if (IS_ERR(rq))
928 return PTR_ERR(rq);
929
930 bio = rq->bio;
2c9ecdf4
FT
931 if (rq->next_rq)
932 bidi_bio = rq->next_rq->bio;
d351af01 933 blk_execute_rq(bd->queue, NULL, rq, 0);
2d507a01 934 ret = blk_complete_sgv4_hdr_rq(rq, &hdr, bio, bidi_bio);
10e8855b
FT
935
936 if (copy_to_user(uarg, &hdr, sizeof(hdr)))
937 return -EFAULT;
b711afa6 938
2d507a01 939 return ret;
10e8855b 940 }
3d6392cf
JA
941 /*
942 * block device ioctls
943 */
944 default:
945#if 0
946 return ioctl_by_bdev(bd->bdev, cmd, arg);
947#else
948 return -ENOTTY;
949#endif
950 }
951}
952
7344be05 953static const struct file_operations bsg_fops = {
3d6392cf
JA
954 .read = bsg_read,
955 .write = bsg_write,
956 .poll = bsg_poll,
957 .open = bsg_open,
958 .release = bsg_release,
25fd1643 959 .unlocked_ioctl = bsg_ioctl,
3d6392cf
JA
960 .owner = THIS_MODULE,
961};
962
d351af01 963void bsg_unregister_queue(struct request_queue *q)
3d6392cf 964{
d351af01 965 struct bsg_class_device *bcd = &q->bsg_dev;
3d6392cf 966
df468820
FT
967 if (!bcd->class_dev)
968 return;
3d6392cf
JA
969
970 mutex_lock(&bsg_mutex);
598443a2 971 idr_remove(&bsg_minor_idr, bcd->minor);
d351af01 972 sysfs_remove_link(&q->kobj, "bsg");
ee959b00 973 device_unregister(bcd->class_dev);
3d6392cf 974 bcd->class_dev = NULL;
97f46ae4 975 kref_put(&bcd->ref, bsg_kref_release_function);
3d6392cf
JA
976 mutex_unlock(&bsg_mutex);
977}
4cf0723a 978EXPORT_SYMBOL_GPL(bsg_unregister_queue);
3d6392cf 979
97f46ae4
FT
980int bsg_register_queue(struct request_queue *q, struct device *parent,
981 const char *name, void (*release)(struct device *))
3d6392cf 982{
598443a2 983 struct bsg_class_device *bcd;
3d6392cf 984 dev_t dev;
598443a2 985 int ret, minor;
ee959b00 986 struct device *class_dev = NULL;
39dca558
JB
987 const char *devname;
988
989 if (name)
990 devname = name;
991 else
97f46ae4 992 devname = parent->bus_id;
3d6392cf
JA
993
994 /*
995 * we need a proper transport to send commands, not a stacked device
996 */
997 if (!q->request_fn)
998 return 0;
999
d351af01 1000 bcd = &q->bsg_dev;
3d6392cf 1001 memset(bcd, 0, sizeof(*bcd));
3d6392cf
JA
1002
1003 mutex_lock(&bsg_mutex);
292b7f27 1004
598443a2
FT
1005 ret = idr_pre_get(&bsg_minor_idr, GFP_KERNEL);
1006 if (!ret) {
1007 ret = -ENOMEM;
1008 goto unlock;
292b7f27
FT
1009 }
1010
598443a2
FT
1011 ret = idr_get_new(&bsg_minor_idr, bcd, &minor);
1012 if (ret < 0)
1013 goto unlock;
292b7f27 1014
598443a2
FT
1015 if (minor >= BSG_MAX_DEVS) {
1016 printk(KERN_ERR "bsg: too many bsg devices\n");
1017 ret = -EINVAL;
1018 goto remove_idr;
1019 }
1020
1021 bcd->minor = minor;
d351af01 1022 bcd->queue = q;
97f46ae4
FT
1023 bcd->parent = get_device(parent);
1024 bcd->release = release;
1025 kref_init(&bcd->ref);
46f6ef4a 1026 dev = MKDEV(bsg_major, bcd->minor);
97f46ae4 1027 class_dev = device_create(bsg_class, parent, dev, "%s", devname);
4e2872d6
FT
1028 if (IS_ERR(class_dev)) {
1029 ret = PTR_ERR(class_dev);
598443a2 1030 goto put_dev;
4e2872d6
FT
1031 }
1032 bcd->class_dev = class_dev;
1033
abce891a 1034 if (q->kobj.sd) {
4e2872d6
FT
1035 ret = sysfs_create_link(&q->kobj, &bcd->class_dev->kobj, "bsg");
1036 if (ret)
598443a2 1037 goto unregister_class_dev;
4e2872d6
FT
1038 }
1039
3d6392cf
JA
1040 mutex_unlock(&bsg_mutex);
1041 return 0;
6826ee4f 1042
598443a2 1043unregister_class_dev:
ee959b00 1044 device_unregister(class_dev);
598443a2 1045put_dev:
97f46ae4 1046 put_device(parent);
598443a2
FT
1047remove_idr:
1048 idr_remove(&bsg_minor_idr, minor);
1049unlock:
264a0472 1050 mutex_unlock(&bsg_mutex);
4e2872d6
FT
1051 return ret;
1052}
4cf0723a 1053EXPORT_SYMBOL_GPL(bsg_register_queue);
4e2872d6 1054
7e7654a9 1055static struct cdev bsg_cdev;
292b7f27 1056
3d6392cf
JA
1057static int __init bsg_init(void)
1058{
1059 int ret, i;
46f6ef4a 1060 dev_t devid;
3d6392cf 1061
5309cb38 1062 bsg_cmd_cachep = kmem_cache_create("bsg_cmd",
20c2df83 1063 sizeof(struct bsg_command), 0, 0, NULL);
5309cb38
JA
1064 if (!bsg_cmd_cachep) {
1065 printk(KERN_ERR "bsg: failed creating slab cache\n");
1066 return -ENOMEM;
1067 }
1068
25fd1643 1069 for (i = 0; i < BSG_LIST_ARRAY_SIZE; i++)
3d6392cf
JA
1070 INIT_HLIST_HEAD(&bsg_device_list[i]);
1071
1072 bsg_class = class_create(THIS_MODULE, "bsg");
5309cb38 1073 if (IS_ERR(bsg_class)) {
9b9f770c
FT
1074 ret = PTR_ERR(bsg_class);
1075 goto destroy_kmemcache;
5309cb38 1076 }
3d6392cf 1077
46f6ef4a 1078 ret = alloc_chrdev_region(&devid, 0, BSG_MAX_DEVS, "bsg");
9b9f770c
FT
1079 if (ret)
1080 goto destroy_bsg_class;
292b7f27 1081
46f6ef4a
JA
1082 bsg_major = MAJOR(devid);
1083
292b7f27 1084 cdev_init(&bsg_cdev, &bsg_fops);
46f6ef4a 1085 ret = cdev_add(&bsg_cdev, MKDEV(bsg_major, 0), BSG_MAX_DEVS);
9b9f770c
FT
1086 if (ret)
1087 goto unregister_chrdev;
3d6392cf 1088
5d3a8cd3 1089 printk(KERN_INFO BSG_DESCRIPTION " version " BSG_VERSION
0ed081ce 1090 " loaded (major %d)\n", bsg_major);
3d6392cf 1091 return 0;
9b9f770c
FT
1092unregister_chrdev:
1093 unregister_chrdev_region(MKDEV(bsg_major, 0), BSG_MAX_DEVS);
1094destroy_bsg_class:
1095 class_destroy(bsg_class);
1096destroy_kmemcache:
1097 kmem_cache_destroy(bsg_cmd_cachep);
1098 return ret;
3d6392cf
JA
1099}
1100
1101MODULE_AUTHOR("Jens Axboe");
0ed081ce 1102MODULE_DESCRIPTION(BSG_DESCRIPTION);
3d6392cf
JA
1103MODULE_LICENSE("GPL");
1104
4e2872d6 1105device_initcall(bsg_init);