/*
 * Copyright (C) 2016 CNEX Labs
 * Initial release: Javier Gonzalez <javier@cnexlabs.com>
 *                  Matias Bjorling <matias@cnexlabs.com>
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License version
 * 2 as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * pblk-core.c - pblk's core functionality
 *
 */

#include "pblk.h"

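/* Mark a block as grown bad in the device's bad block table. This runs from
 * a workqueue (pblk->bb_wq) because updating the table may sleep, while the
 * erase completion path that schedules it cannot.
 */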
static void pblk_line_mark_bb(struct work_struct *work)
{
	struct pblk_line_ws *line_ws = container_of(work, struct pblk_line_ws,
									ws);
	struct pblk *pblk = line_ws->pblk;
	struct nvm_tgt_dev *dev = pblk->dev;
	struct ppa_addr *ppa = line_ws->priv;
	int ret;

	ret = nvm_set_tgt_bb_tbl(dev, ppa, 1, NVM_BLK_T_GRWN_BAD);
	if (ret) {
		struct pblk_line *line;
		int pos;

		line = &pblk->lines[pblk_ppa_to_line(*ppa)];
		pos = pblk_ppa_to_pos(&dev->geo, *ppa);

		pr_err("pblk: failed to mark bb, line:%d, pos:%d\n",
				line->id, pos);
	}

	kfree(ppa);
	mempool_free(line_ws, pblk->gen_ws_pool);
}

static void pblk_mark_bb(struct pblk *pblk, struct pblk_line *line,
			 struct ppa_addr *ppa)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	int pos = pblk_ppa_to_pos(geo, *ppa);

	pr_debug("pblk: erase failed: line:%d, pos:%d\n", line->id, pos);
	atomic_long_inc(&pblk->erase_failed);

	atomic_dec(&line->blk_in_line);
	if (test_and_set_bit(pos, line->blk_bitmap))
		pr_err("pblk: attempted to erase bb: line:%d, pos:%d\n",
							line->id, pos);

	pblk_gen_run_ws(pblk, NULL, ppa, pblk_line_mark_bb,
						GFP_ATOMIC, pblk->bb_wq);
}

static void __pblk_end_io_erase(struct pblk *pblk, struct nvm_rq *rqd)
{
	struct pblk_line *line;

	line = &pblk->lines[pblk_ppa_to_line(rqd->ppa_addr)];
	atomic_dec(&line->left_seblks);

	if (rqd->error) {
		struct ppa_addr *ppa;

		ppa = kmalloc(sizeof(struct ppa_addr), GFP_ATOMIC);
		if (!ppa)
			return;

		*ppa = rqd->ppa_addr;
		pblk_mark_bb(pblk, line, ppa);
	}

	atomic_dec(&pblk->inflight_io);
}

/* Erase completion assumes that only one block is erased at a time */
static void pblk_end_io_erase(struct nvm_rq *rqd)
{
	struct pblk *pblk = rqd->private;

	__pblk_end_io_erase(pblk, rqd);
	mempool_free(rqd, pblk->e_rq_pool);
}

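/* Invalidate a mapped sector: set its bit in the line's invalid bitmap,
 * decrement the line's valid sector count (vsc) and, if the line is already
 * closed, move the line to the GC list matching its new vsc.
 */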
void __pblk_map_invalidate(struct pblk *pblk, struct pblk_line *line,
			   u64 paddr)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct list_head *move_list = NULL;

	/* Lines being reclaimed (GC'ed) cannot be invalidated. Before the L2P
	 * table is modified with reclaimed sectors, a check is done to ensure
	 * that newer updates are not overwritten.
	 */
	spin_lock(&line->lock);
	WARN_ON(line->state == PBLK_LINESTATE_FREE);

	if (test_and_set_bit(paddr, line->invalid_bitmap)) {
		WARN_ONCE(1, "pblk: double invalidate\n");
		spin_unlock(&line->lock);
		return;
	}
	le32_add_cpu(line->vsc, -1);

	if (line->state == PBLK_LINESTATE_CLOSED)
		move_list = pblk_line_gc_list(pblk, line);
	spin_unlock(&line->lock);

	if (move_list) {
		spin_lock(&l_mg->gc_lock);
		spin_lock(&line->lock);
		/* Prevent moving a line that has just been chosen for GC */
		if (line->state == PBLK_LINESTATE_GC) {
			spin_unlock(&line->lock);
			spin_unlock(&l_mg->gc_lock);
			return;
		}
		spin_unlock(&line->lock);

		list_move_tail(&line->list, move_list);
		spin_unlock(&l_mg->gc_lock);
	}
}

void pblk_map_invalidate(struct pblk *pblk, struct ppa_addr ppa)
{
	struct pblk_line *line;
	u64 paddr;
	int line_id;

#ifdef CONFIG_NVM_DEBUG
	/* Callers must ensure that the ppa points to a device address */
	BUG_ON(pblk_addr_in_cache(ppa));
	BUG_ON(pblk_ppa_empty(ppa));
#endif

	line_id = pblk_ppa_to_line(ppa);
	line = &pblk->lines[line_id];
	paddr = pblk_dev_ppa_to_line_addr(pblk, ppa);

	__pblk_map_invalidate(pblk, line, paddr);
}

static void pblk_invalidate_range(struct pblk *pblk, sector_t slba,
				  unsigned int nr_secs)
{
	sector_t lba;

	spin_lock(&pblk->trans_lock);
	for (lba = slba; lba < slba + nr_secs; lba++) {
		struct ppa_addr ppa;

		ppa = pblk_trans_map_get(pblk, lba);

		if (!pblk_addr_in_cache(ppa) && !pblk_ppa_empty(ppa))
			pblk_map_invalidate(pblk, ppa);

		pblk_ppa_set_empty(&ppa);
		pblk_trans_map_set(pblk, lba, ppa);
	}
	spin_unlock(&pblk->trans_lock);
}

/* Caller must guarantee that the request is a valid type */
struct nvm_rq *pblk_alloc_rqd(struct pblk *pblk, int type)
{
	mempool_t *pool;
	struct nvm_rq *rqd;
	int rq_size;

	switch (type) {
	case PBLK_WRITE:
	case PBLK_WRITE_INT:
		pool = pblk->w_rq_pool;
		rq_size = pblk_w_rq_size;
		break;
	case PBLK_READ:
		pool = pblk->r_rq_pool;
		rq_size = pblk_g_rq_size;
		break;
	default:
		pool = pblk->e_rq_pool;
		rq_size = pblk_g_rq_size;
	}

	rqd = mempool_alloc(pool, GFP_KERNEL);
	memset(rqd, 0, rq_size);

	return rqd;
}

/* Typically used on completion path. Cannot guarantee request consistency */
void pblk_free_rqd(struct pblk *pblk, struct nvm_rq *rqd, int type)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	mempool_t *pool;

	switch (type) {
	case PBLK_WRITE:
		kfree(((struct pblk_c_ctx *)nvm_rq_to_pdu(rqd))->lun_bitmap);
		/* fall through */
	case PBLK_WRITE_INT:
		pool = pblk->w_rq_pool;
		break;
	case PBLK_READ:
		pool = pblk->r_rq_pool;
		break;
	case PBLK_ERASE:
		pool = pblk->e_rq_pool;
		break;
	default:
		pr_err("pblk: trying to free unknown rqd type\n");
		return;
	}

	nvm_dev_dma_free(dev->parent, rqd->meta_list, rqd->dma_meta_list);
	mempool_free(rqd, pool);
}

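/* Helpers for bios backed by pblk->page_bio_pool. Pages added by
 * pblk_bio_add_pages() must be returned to the same pool, as done in
 * pblk_bio_free_pages().
 */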
void pblk_bio_free_pages(struct pblk *pblk, struct bio *bio, int off,
			 int nr_pages)
{
	struct bio_vec bv;
	int i;

	WARN_ON(off + nr_pages != bio->bi_vcnt);

	for (i = off; i < nr_pages + off; i++) {
		bv = bio->bi_io_vec[i];
		mempool_free(bv.bv_page, pblk->page_bio_pool);
	}
}

int pblk_bio_add_pages(struct pblk *pblk, struct bio *bio, gfp_t flags,
		       int nr_pages)
{
	struct request_queue *q = pblk->dev->q;
	struct page *page;
	int i, ret;

	for (i = 0; i < nr_pages; i++) {
		page = mempool_alloc(pblk->page_bio_pool, flags);

		ret = bio_add_pc_page(q, bio, page, PBLK_EXPOSED_PAGE_SIZE, 0);
		if (ret != PBLK_EXPOSED_PAGE_SIZE) {
			pr_err("pblk: could not add page to bio\n");
			mempool_free(page, pblk->page_bio_pool);
			goto err;
		}
	}

	return 0;
err:
	/* i pages were added before the failing one, which was freed above */
	pblk_bio_free_pages(pblk, bio, 0, i);
	return -1;
}

static void pblk_write_kick(struct pblk *pblk)
{
	wake_up_process(pblk->writer_ts);
	mod_timer(&pblk->wtimer, jiffies + msecs_to_jiffies(1000));
}

void pblk_write_timer_fn(struct timer_list *t)
{
	struct pblk *pblk = from_timer(pblk, t, wtimer);

	/* kick the write thread every tick to flush outstanding data */
	pblk_write_kick(pblk);
}

void pblk_write_should_kick(struct pblk *pblk)
{
	unsigned int secs_avail = pblk_rb_read_count(&pblk->rwb);

	if (secs_avail >= pblk->min_write_pgs)
		pblk_write_kick(pblk);
}

void pblk_end_io_sync(struct nvm_rq *rqd)
{
	struct completion *waiting = rqd->private;

	complete(waiting);
}

static void pblk_wait_for_meta(struct pblk *pblk)
{
	do {
		if (!atomic_read(&pblk->inflight_io))
			break;

		schedule();
	} while (1);
}

static void pblk_flush_writer(struct pblk *pblk)
{
	pblk_rb_flush(&pblk->rwb);
	do {
		if (!pblk_rb_sync_count(&pblk->rwb))
			break;

		pblk_write_kick(pblk);
		schedule();
	} while (1);
}

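/* Pick the GC list matching a line's valid sector count (vsc): full when all
 * sectors are invalid (vsc == 0), then high/mid/low against the lm->high_thrs
 * and lm->mid_thrs watermarks, and empty when nothing has been invalidated
 * yet (vsc == sec_in_line). Returns the list the line must move to, or NULL
 * if it is already on the right one. Called with line->lock held.
 */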
struct list_head *pblk_line_gc_list(struct pblk *pblk, struct pblk_line *line)
{
	struct pblk_line_meta *lm = &pblk->lm;
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct list_head *move_list = NULL;
	int vsc = le32_to_cpu(*line->vsc);

	lockdep_assert_held(&line->lock);

	if (!vsc) {
		if (line->gc_group != PBLK_LINEGC_FULL) {
			line->gc_group = PBLK_LINEGC_FULL;
			move_list = &l_mg->gc_full_list;
		}
	} else if (vsc < lm->high_thrs) {
		if (line->gc_group != PBLK_LINEGC_HIGH) {
			line->gc_group = PBLK_LINEGC_HIGH;
			move_list = &l_mg->gc_high_list;
		}
	} else if (vsc < lm->mid_thrs) {
		if (line->gc_group != PBLK_LINEGC_MID) {
			line->gc_group = PBLK_LINEGC_MID;
			move_list = &l_mg->gc_mid_list;
		}
	} else if (vsc < line->sec_in_line) {
		if (line->gc_group != PBLK_LINEGC_LOW) {
			line->gc_group = PBLK_LINEGC_LOW;
			move_list = &l_mg->gc_low_list;
		}
	} else if (vsc == line->sec_in_line) {
		if (line->gc_group != PBLK_LINEGC_EMPTY) {
			line->gc_group = PBLK_LINEGC_EMPTY;
			move_list = &l_mg->gc_empty_list;
		}
	} else {
		line->state = PBLK_LINESTATE_CORRUPT;
		line->gc_group = PBLK_LINEGC_NONE;
		move_list = &l_mg->corrupt_list;
		pr_err("pblk: corrupted vsc for line %d, vsc:%d (%d/%d/%d)\n",
						line->id, vsc,
						line->sec_in_line,
						lm->high_thrs, lm->mid_thrs);
	}

	return move_list;
}

void pblk_discard(struct pblk *pblk, struct bio *bio)
{
	sector_t slba = pblk_get_lba(bio);
	sector_t nr_secs = pblk_get_secs(bio);

	pblk_invalidate_range(pblk, slba, nr_secs);
}

void pblk_log_write_err(struct pblk *pblk, struct nvm_rq *rqd)
{
	atomic_long_inc(&pblk->write_failed);
#ifdef CONFIG_NVM_DEBUG
	pblk_print_failed_rqd(pblk, rqd, rqd->error);
#endif
}

void pblk_log_read_err(struct pblk *pblk, struct nvm_rq *rqd)
{
	/* Empty page read is not necessarily an error (e.g., L2P recovery) */
	if (rqd->error == NVM_RSP_ERR_EMPTYPAGE) {
		atomic_long_inc(&pblk->read_empty);
		return;
	}

	switch (rqd->error) {
	case NVM_RSP_WARN_HIGHECC:
		atomic_long_inc(&pblk->read_high_ecc);
		break;
	case NVM_RSP_ERR_FAILECC:
	case NVM_RSP_ERR_FAILCRC:
		atomic_long_inc(&pblk->read_failed);
		break;
	default:
		pr_err("pblk: unknown read error:%d\n", rqd->error);
	}
#ifdef CONFIG_NVM_DEBUG
	pblk_print_failed_rqd(pblk, rqd, rqd->error);
#endif
}

void pblk_set_sec_per_write(struct pblk *pblk, int sec_per_write)
{
	pblk->sec_per_write = sec_per_write;
}

int pblk_submit_io(struct pblk *pblk, struct nvm_rq *rqd)
{
	struct nvm_tgt_dev *dev = pblk->dev;

#ifdef CONFIG_NVM_DEBUG
	int ret;

	ret = pblk_check_io(pblk, rqd);
	if (ret)
		return ret;
#endif

	atomic_inc(&pblk->inflight_io);

	return nvm_submit_io(dev, rqd);
}

int pblk_submit_io_sync(struct pblk *pblk, struct nvm_rq *rqd)
{
	struct nvm_tgt_dev *dev = pblk->dev;

#ifdef CONFIG_NVM_DEBUG
	int ret;

	ret = pblk_check_io(pblk, rqd);
	if (ret)
		return ret;
#endif

	atomic_inc(&pblk->inflight_io);

	return nvm_submit_io_sync(dev, rqd);
}

static void pblk_bio_map_addr_endio(struct bio *bio)
{
	bio_put(bio);
}

struct bio *pblk_bio_map_addr(struct pblk *pblk, void *data,
			      unsigned int nr_secs, unsigned int len,
			      int alloc_type, gfp_t gfp_mask)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	void *kaddr = data;
	struct page *page;
	struct bio *bio;
	int i, ret;

	if (alloc_type == PBLK_KMALLOC_META)
		return bio_map_kern(dev->q, kaddr, len, gfp_mask);

	bio = bio_kmalloc(gfp_mask, nr_secs);
	if (!bio)
		return ERR_PTR(-ENOMEM);

	for (i = 0; i < nr_secs; i++) {
		page = vmalloc_to_page(kaddr);
		if (!page) {
			pr_err("pblk: could not map vmalloc bio\n");
			bio_put(bio);
			bio = ERR_PTR(-ENOMEM);
			goto out;
		}

		ret = bio_add_pc_page(dev->q, bio, page, PAGE_SIZE, 0);
		if (ret != PAGE_SIZE) {
			pr_err("pblk: could not add page to bio\n");
			bio_put(bio);
			bio = ERR_PTR(-ENOMEM);
			goto out;
		}

		kaddr += PAGE_SIZE;
	}

	bio->bi_end_io = pblk_bio_map_addr_endio;
out:
	return bio;
}

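/* Decide how many sectors the next write I/O carries: at most sec_per_write,
 * always a multiple of min_write_pgs, and only below the minimum when a
 * flush forces padding. E.g. with min = 4 and max = 64, 19 available sectors
 * yield 16; 2 available sectors yield 0, or 4 when a flush is pending.
 */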
int pblk_calc_secs(struct pblk *pblk, unsigned long secs_avail,
		   unsigned long secs_to_flush)
{
	int max = pblk->sec_per_write;
	int min = pblk->min_write_pgs;
	int secs_to_sync = 0;

	if (secs_avail >= max)
		secs_to_sync = max;
	else if (secs_avail >= min)
		secs_to_sync = min * (secs_avail / min);
	else if (secs_to_flush)
		secs_to_sync = min;

	return secs_to_sync;
}

void pblk_dealloc_page(struct pblk *pblk, struct pblk_line *line, int nr_secs)
{
	u64 addr;
	int i;

	spin_lock(&line->lock);
	addr = find_next_zero_bit(line->map_bitmap,
					pblk->lm.sec_per_line, line->cur_sec);
	line->cur_sec = addr - nr_secs;

	for (i = 0; i < nr_secs; i++, line->cur_sec--)
		WARN_ON(!test_and_clear_bit(line->cur_sec, line->map_bitmap));
	spin_unlock(&line->lock);
}

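/* Reserve the next nr_secs sectors in the line's map bitmap and advance the
 * line's write pointer (cur_sec). Callers must hold line->lock;
 * pblk_alloc_page() below is the locking wrapper, which also accounts for
 * the remaining mappable sectors (left_msecs).
 */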
u64 __pblk_alloc_page(struct pblk *pblk, struct pblk_line *line, int nr_secs)
{
	u64 addr;
	int i;

	lockdep_assert_held(&line->lock);

	/* logic error: ppa out-of-bounds. Prevent generating bad address */
	if (line->cur_sec + nr_secs > pblk->lm.sec_per_line) {
		WARN(1, "pblk: page allocation out of bounds\n");
		nr_secs = pblk->lm.sec_per_line - line->cur_sec;
	}

	line->cur_sec = addr = find_next_zero_bit(line->map_bitmap,
					pblk->lm.sec_per_line, line->cur_sec);
	for (i = 0; i < nr_secs; i++, line->cur_sec++)
		WARN_ON(test_and_set_bit(line->cur_sec, line->map_bitmap));

	return addr;
}

u64 pblk_alloc_page(struct pblk *pblk, struct pblk_line *line, int nr_secs)
{
	u64 addr;

	/* Lock needed in case a write fails and a recovery needs to remap
	 * failed write buffer entries
	 */
	spin_lock(&line->lock);
	addr = __pblk_alloc_page(pblk, line, nr_secs);
	line->left_msecs -= nr_secs;
	WARN(line->left_msecs < 0, "pblk: page allocation out of bounds\n");
	spin_unlock(&line->lock);

	return addr;
}

u64 pblk_lookup_page(struct pblk *pblk, struct pblk_line *line)
{
	u64 paddr;

	spin_lock(&line->lock);
	paddr = find_next_zero_bit(line->map_bitmap,
					pblk->lm.sec_per_line, line->cur_sec);
	spin_unlock(&line->lock);

	return paddr;
}

/*
 * Submit emeta to one LUN in the raid line at a time to avoid a deadlock when
 * taking the per LUN semaphore.
 */
static int pblk_line_submit_emeta_io(struct pblk *pblk, struct pblk_line *line,
				     void *emeta_buf, u64 paddr, int dir)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_line_meta *lm = &pblk->lm;
	void *ppa_list, *meta_list;
	struct bio *bio;
	struct nvm_rq rqd;
	dma_addr_t dma_ppa_list, dma_meta_list;
	int min = pblk->min_write_pgs;
	int left_ppas = lm->emeta_sec[0];
	int id = line->id;
	int rq_ppas, rq_len;
	int cmd_op, bio_op;
	int i, j;
	int ret;

	if (dir == PBLK_WRITE) {
		bio_op = REQ_OP_WRITE;
		cmd_op = NVM_OP_PWRITE;
	} else if (dir == PBLK_READ) {
		bio_op = REQ_OP_READ;
		cmd_op = NVM_OP_PREAD;
	} else
		return -EINVAL;

	meta_list = nvm_dev_dma_alloc(dev->parent, GFP_KERNEL,
							&dma_meta_list);
	if (!meta_list)
		return -ENOMEM;

	ppa_list = meta_list + pblk_dma_meta_size;
	dma_ppa_list = dma_meta_list + pblk_dma_meta_size;

next_rq:
	memset(&rqd, 0, sizeof(struct nvm_rq));

	rq_ppas = pblk_calc_secs(pblk, left_ppas, 0);
	rq_len = rq_ppas * geo->sec_size;

	bio = pblk_bio_map_addr(pblk, emeta_buf, rq_ppas, rq_len,
					l_mg->emeta_alloc_type, GFP_KERNEL);
	if (IS_ERR(bio)) {
		ret = PTR_ERR(bio);
		goto free_rqd_dma;
	}

	bio->bi_iter.bi_sector = 0; /* internal bio */
	bio_set_op_attrs(bio, bio_op, 0);

	rqd.bio = bio;
	rqd.meta_list = meta_list;
	rqd.ppa_list = ppa_list;
	rqd.dma_meta_list = dma_meta_list;
	rqd.dma_ppa_list = dma_ppa_list;
	rqd.opcode = cmd_op;
	rqd.nr_ppas = rq_ppas;

	if (dir == PBLK_WRITE) {
		struct pblk_sec_meta *meta_list = rqd.meta_list;

		rqd.flags = pblk_set_progr_mode(pblk, PBLK_WRITE);
		for (i = 0; i < rqd.nr_ppas; ) {
			spin_lock(&line->lock);
			paddr = __pblk_alloc_page(pblk, line, min);
			spin_unlock(&line->lock);
			for (j = 0; j < min; j++, i++, paddr++) {
				meta_list[i].lba = cpu_to_le64(ADDR_EMPTY);
				rqd.ppa_list[i] =
					addr_to_gen_ppa(pblk, paddr, id);
			}
		}
	} else {
		for (i = 0; i < rqd.nr_ppas; ) {
			struct ppa_addr ppa = addr_to_gen_ppa(pblk, paddr, id);
			int pos = pblk_ppa_to_pos(geo, ppa);
			int read_type = PBLK_READ_RANDOM;

			if (pblk_io_aligned(pblk, rq_ppas))
				read_type = PBLK_READ_SEQUENTIAL;
			rqd.flags = pblk_set_read_mode(pblk, read_type);

			while (test_bit(pos, line->blk_bitmap)) {
				paddr += min;
				if (pblk_boundary_paddr_checks(pblk, paddr)) {
					pr_err("pblk: corrupt emeta line:%d\n",
								line->id);
					bio_put(bio);
					ret = -EINTR;
					goto free_rqd_dma;
				}

				ppa = addr_to_gen_ppa(pblk, paddr, id);
				pos = pblk_ppa_to_pos(geo, ppa);
			}

			if (pblk_boundary_paddr_checks(pblk, paddr + min)) {
				pr_err("pblk: corrupt emeta line:%d\n",
								line->id);
				bio_put(bio);
				ret = -EINTR;
				goto free_rqd_dma;
			}

			for (j = 0; j < min; j++, i++, paddr++)
				rqd.ppa_list[i] =
					addr_to_gen_ppa(pblk, paddr, line->id);
		}
	}

	ret = pblk_submit_io_sync(pblk, &rqd);
	if (ret) {
		pr_err("pblk: emeta I/O submission failed: %d\n", ret);
		bio_put(bio);
		goto free_rqd_dma;
	}

	atomic_dec(&pblk->inflight_io);

	if (rqd.error) {
		if (dir == PBLK_WRITE)
			pblk_log_write_err(pblk, &rqd);
		else
			pblk_log_read_err(pblk, &rqd);
	}

	emeta_buf += rq_len;
	left_ppas -= rq_ppas;
	if (left_ppas)
		goto next_rq;
free_rqd_dma:
	nvm_dev_dma_free(dev->parent, rqd.meta_list, rqd.dma_meta_list);
	return ret;
}

u64 pblk_line_smeta_start(struct pblk *pblk, struct pblk_line *line)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct pblk_line_meta *lm = &pblk->lm;
	int bit;

	/* This usually only happens on bad lines */
	bit = find_first_zero_bit(line->blk_bitmap, lm->blk_per_line);
	if (bit >= lm->blk_per_line)
		return -1;

	return bit * geo->sec_per_pl;
}

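/* Read or write a line's start metadata (smeta) with a single synchronous
 * I/O. On writes, the per-sector lba entries are set to ADDR_EMPTY, marking
 * the smeta sectors as holding no user data.
 */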
static int pblk_line_submit_smeta_io(struct pblk *pblk, struct pblk_line *line,
				     u64 paddr, int dir)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct pblk_line_meta *lm = &pblk->lm;
	struct bio *bio;
	struct nvm_rq rqd;
	__le64 *lba_list = NULL;
	int i, ret;
	int cmd_op, bio_op;
	int flags;

	if (dir == PBLK_WRITE) {
		bio_op = REQ_OP_WRITE;
		cmd_op = NVM_OP_PWRITE;
		flags = pblk_set_progr_mode(pblk, PBLK_WRITE);
		lba_list = emeta_to_lbas(pblk, line->emeta->buf);
	} else if (dir == PBLK_READ_RECOV || dir == PBLK_READ) {
		bio_op = REQ_OP_READ;
		cmd_op = NVM_OP_PREAD;
		flags = pblk_set_read_mode(pblk, PBLK_READ_SEQUENTIAL);
	} else
		return -EINVAL;

	memset(&rqd, 0, sizeof(struct nvm_rq));

	rqd.meta_list = nvm_dev_dma_alloc(dev->parent, GFP_KERNEL,
							&rqd.dma_meta_list);
	if (!rqd.meta_list)
		return -ENOMEM;

	rqd.ppa_list = rqd.meta_list + pblk_dma_meta_size;
	rqd.dma_ppa_list = rqd.dma_meta_list + pblk_dma_meta_size;

	bio = bio_map_kern(dev->q, line->smeta, lm->smeta_len, GFP_KERNEL);
	if (IS_ERR(bio)) {
		ret = PTR_ERR(bio);
		goto free_ppa_list;
	}

	bio->bi_iter.bi_sector = 0; /* internal bio */
	bio_set_op_attrs(bio, bio_op, 0);

	rqd.bio = bio;
	rqd.opcode = cmd_op;
	rqd.flags = flags;
	rqd.nr_ppas = lm->smeta_sec;

	for (i = 0; i < lm->smeta_sec; i++, paddr++) {
		struct pblk_sec_meta *meta_list = rqd.meta_list;

		rqd.ppa_list[i] = addr_to_gen_ppa(pblk, paddr, line->id);

		if (dir == PBLK_WRITE) {
			__le64 addr_empty = cpu_to_le64(ADDR_EMPTY);

			meta_list[i].lba = lba_list[paddr] = addr_empty;
		}
	}

	/*
	 * This I/O is sent by the write thread when a line is replaced. Since
	 * the write thread is the only one sending write and erase commands,
	 * there is no need to take the LUN semaphore.
	 */
	ret = pblk_submit_io_sync(pblk, &rqd);
	if (ret) {
		pr_err("pblk: smeta I/O submission failed: %d\n", ret);
		bio_put(bio);
		goto free_ppa_list;
	}

	atomic_dec(&pblk->inflight_io);

	if (rqd.error) {
		if (dir == PBLK_WRITE)
			pblk_log_write_err(pblk, &rqd);
		else if (dir == PBLK_READ)
			pblk_log_read_err(pblk, &rqd);
	}

free_ppa_list:
	nvm_dev_dma_free(dev->parent, rqd.meta_list, rqd.dma_meta_list);

	return ret;
}

int pblk_line_read_smeta(struct pblk *pblk, struct pblk_line *line)
{
	u64 bpaddr = pblk_line_smeta_start(pblk, line);

	return pblk_line_submit_smeta_io(pblk, line, bpaddr, PBLK_READ_RECOV);
}

int pblk_line_read_emeta(struct pblk *pblk, struct pblk_line *line,
			 void *emeta_buf)
{
	return pblk_line_submit_emeta_io(pblk, line, emeta_buf,
						line->emeta_ssec, PBLK_READ);
}

static void pblk_setup_e_rq(struct pblk *pblk, struct nvm_rq *rqd,
			    struct ppa_addr ppa)
{
	rqd->opcode = NVM_OP_ERASE;
	rqd->ppa_addr = ppa;
	rqd->nr_ppas = 1;
	rqd->flags = pblk_set_progr_mode(pblk, PBLK_ERASE);
	rqd->bio = NULL;
}

static int pblk_blk_erase_sync(struct pblk *pblk, struct ppa_addr ppa)
{
	struct nvm_rq rqd;
	int ret = 0;

	memset(&rqd, 0, sizeof(struct nvm_rq));

	pblk_setup_e_rq(pblk, &rqd, ppa);

	/* The write thread schedules erases so that it minimizes disturbances
	 * with writes. Thus, there is no need to take the LUN semaphore.
	 */
	ret = pblk_submit_io_sync(pblk, &rqd);
	if (ret) {
		struct nvm_tgt_dev *dev = pblk->dev;
		struct nvm_geo *geo = &dev->geo;

		pr_err("pblk: could not sync erase line:%d,blk:%d\n",
					pblk_ppa_to_line(ppa),
					pblk_ppa_to_pos(geo, ppa));

		rqd.error = ret;
		goto out;
	}

out:
	rqd.private = pblk;
	__pblk_end_io_erase(pblk, &rqd);

	return ret;
}

int pblk_line_erase(struct pblk *pblk, struct pblk_line *line)
{
	struct pblk_line_meta *lm = &pblk->lm;
	struct ppa_addr ppa;
	int ret, bit = -1;

	/* Erase only good blocks, one at a time */
	do {
		spin_lock(&line->lock);
		bit = find_next_zero_bit(line->erase_bitmap, lm->blk_per_line,
								bit + 1);
		if (bit >= lm->blk_per_line) {
			spin_unlock(&line->lock);
			break;
		}

		ppa = pblk->luns[bit].bppa; /* set ch and lun */
		ppa.g.blk = line->id;

		atomic_dec(&line->left_eblks);
		WARN_ON(test_and_set_bit(bit, line->erase_bitmap));
		spin_unlock(&line->lock);

		ret = pblk_blk_erase_sync(pblk, ppa);
		if (ret) {
			pr_err("pblk: failed to erase line %d\n", line->id);
			return ret;
		}
	} while (1);

	return 0;
}

static void pblk_line_setup_metadata(struct pblk_line *line,
				     struct pblk_line_mgmt *l_mg,
				     struct pblk_line_meta *lm)
{
	int meta_line;

	lockdep_assert_held(&l_mg->free_lock);

retry_meta:
	meta_line = find_first_zero_bit(&l_mg->meta_bitmap, PBLK_DATA_LINES);
	if (meta_line == PBLK_DATA_LINES) {
		spin_unlock(&l_mg->free_lock);
		io_schedule();
		spin_lock(&l_mg->free_lock);
		goto retry_meta;
	}

	set_bit(meta_line, &l_mg->meta_bitmap);
	line->meta_line = meta_line;

	line->smeta = l_mg->sline_meta[meta_line];
	line->emeta = l_mg->eline_meta[meta_line];

	memset(line->smeta, 0, lm->smeta_len);
	memset(line->emeta->buf, 0, lm->emeta_len[0]);

	line->emeta->mem = 0;
	atomic_set(&line->emeta->sync, 0);
}

/* For now lines are always assumed full lines. Thus, smeta former and current
 * lun bitmaps are omitted.
 */
static int pblk_line_init_metadata(struct pblk *pblk, struct pblk_line *line,
				   struct pblk_line *cur)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct pblk_line_meta *lm = &pblk->lm;
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_emeta *emeta = line->emeta;
	struct line_emeta *emeta_buf = emeta->buf;
	struct line_smeta *smeta_buf = (struct line_smeta *)line->smeta;
	int nr_blk_line;

	/* After erasing the line, new bad blocks might appear and we risk
	 * having an invalid line
	 */
	nr_blk_line = lm->blk_per_line -
			bitmap_weight(line->blk_bitmap, lm->blk_per_line);
	if (nr_blk_line < lm->min_blk_line) {
		spin_lock(&l_mg->free_lock);
		spin_lock(&line->lock);
		line->state = PBLK_LINESTATE_BAD;
		spin_unlock(&line->lock);

		list_add_tail(&line->list, &l_mg->bad_list);
		spin_unlock(&l_mg->free_lock);

		pr_debug("pblk: line %d is bad\n", line->id);

		return 0;
	}

	/* Run-time metadata */
	line->lun_bitmap = ((void *)(smeta_buf)) + sizeof(struct line_smeta);

	/* Mark LUNs allocated in this line (all for now) */
	bitmap_set(line->lun_bitmap, 0, lm->lun_bitmap_len);

	smeta_buf->header.identifier = cpu_to_le32(PBLK_MAGIC);
	memcpy(smeta_buf->header.uuid, pblk->instance_uuid, 16);
	smeta_buf->header.id = cpu_to_le32(line->id);
	smeta_buf->header.type = cpu_to_le16(line->type);
	smeta_buf->header.version_major = SMETA_VERSION_MAJOR;
	smeta_buf->header.version_minor = SMETA_VERSION_MINOR;

	/* Start metadata */
	smeta_buf->seq_nr = cpu_to_le64(line->seq_nr);
	smeta_buf->window_wr_lun = cpu_to_le32(geo->all_luns);

	/* Fill metadata among lines */
	if (cur) {
		memcpy(line->lun_bitmap, cur->lun_bitmap, lm->lun_bitmap_len);
		smeta_buf->prev_id = cpu_to_le32(cur->id);
		cur->emeta->buf->next_id = cpu_to_le32(line->id);
	} else {
		smeta_buf->prev_id = cpu_to_le32(PBLK_LINE_EMPTY);
	}

	/* All smeta must be set at this point */
	smeta_buf->header.crc = cpu_to_le32(
			pblk_calc_meta_header_crc(pblk, &smeta_buf->header));
	smeta_buf->crc = cpu_to_le32(pblk_calc_smeta_crc(pblk, smeta_buf));

	/* End metadata */
	memcpy(&emeta_buf->header, &smeta_buf->header,
						sizeof(struct line_header));

	emeta_buf->header.version_major = EMETA_VERSION_MAJOR;
	emeta_buf->header.version_minor = EMETA_VERSION_MINOR;
	emeta_buf->header.crc = cpu_to_le32(
			pblk_calc_meta_header_crc(pblk, &emeta_buf->header));

	emeta_buf->seq_nr = cpu_to_le64(line->seq_nr);
	emeta_buf->nr_lbas = cpu_to_le64(line->sec_in_line);
	emeta_buf->nr_valid_lbas = cpu_to_le64(0);
	emeta_buf->next_id = cpu_to_le32(PBLK_LINE_EMPTY);
	emeta_buf->crc = cpu_to_le32(0);
	emeta_buf->prev_id = smeta_buf->prev_id;

	return 1;
}

/* For now lines are always assumed full lines. Thus, smeta former and current
 * lun bitmaps are omitted.
 */
static int pblk_line_init_bb(struct pblk *pblk, struct pblk_line *line,
			     int init)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct pblk_line_meta *lm = &pblk->lm;
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	u64 off;
	int bit = -1;
	int emeta_secs;

	line->sec_in_line = lm->sec_per_line;

	/* Capture bad block information on line mapping bitmaps */
	while ((bit = find_next_bit(line->blk_bitmap, lm->blk_per_line,
					bit + 1)) < lm->blk_per_line) {
		off = bit * geo->sec_per_pl;
		bitmap_shift_left(l_mg->bb_aux, l_mg->bb_template, off,
							lm->sec_per_line);
		bitmap_or(line->map_bitmap, line->map_bitmap, l_mg->bb_aux,
							lm->sec_per_line);
		line->sec_in_line -= geo->sec_per_chk;
	}

	/* Mark smeta metadata sectors as bad sectors */
	bit = find_first_zero_bit(line->blk_bitmap, lm->blk_per_line);
	off = bit * geo->sec_per_pl;
	bitmap_set(line->map_bitmap, off, lm->smeta_sec);
	line->sec_in_line -= lm->smeta_sec;
	line->smeta_ssec = off;
	line->cur_sec = off + lm->smeta_sec;

	if (init && pblk_line_submit_smeta_io(pblk, line, off, PBLK_WRITE)) {
		pr_debug("pblk: line smeta I/O failed. Retry\n");
		return 1;
	}

	bitmap_copy(line->invalid_bitmap, line->map_bitmap, lm->sec_per_line);

	/* Mark emeta metadata sectors as bad sectors. We need to consider bad
	 * blocks to make sure that there are enough sectors to store emeta
	 */
	emeta_secs = lm->emeta_sec[0];
	off = lm->sec_per_line;
	while (emeta_secs) {
		off -= geo->sec_per_pl;
		if (!test_bit(off, line->invalid_bitmap)) {
			bitmap_set(line->invalid_bitmap, off, geo->sec_per_pl);
			emeta_secs -= geo->sec_per_pl;
		}
	}

	line->emeta_ssec = off;
	line->sec_in_line -= lm->emeta_sec[0];
	line->nr_valid_lbas = 0;
	line->left_msecs = line->sec_in_line;
	*line->vsc = cpu_to_le32(line->sec_in_line);

	if (lm->sec_per_line - line->sec_in_line !=
		bitmap_weight(line->invalid_bitmap, lm->sec_per_line)) {
		spin_lock(&line->lock);
		line->state = PBLK_LINESTATE_BAD;
		spin_unlock(&line->lock);

		list_add_tail(&line->list, &l_mg->bad_list);
		pr_err("pblk: unexpected line %d is bad\n", line->id);

		return 0;
	}

	return 1;
}

static int pblk_line_prepare(struct pblk *pblk, struct pblk_line *line)
{
	struct pblk_line_meta *lm = &pblk->lm;
	int blk_in_line = atomic_read(&line->blk_in_line);

	line->map_bitmap = kzalloc(lm->sec_bitmap_len, GFP_ATOMIC);
	if (!line->map_bitmap)
		return -ENOMEM;

	/* will be initialized using bb info from map_bitmap */
	line->invalid_bitmap = kmalloc(lm->sec_bitmap_len, GFP_ATOMIC);
	if (!line->invalid_bitmap) {
		kfree(line->map_bitmap);
		return -ENOMEM;
	}

	spin_lock(&line->lock);
	if (line->state != PBLK_LINESTATE_FREE) {
		kfree(line->map_bitmap);
		kfree(line->invalid_bitmap);
		spin_unlock(&line->lock);
		WARN(1, "pblk: corrupted line %d, state %d\n",
							line->id, line->state);
		return -EAGAIN;
	}

	line->state = PBLK_LINESTATE_OPEN;

	atomic_set(&line->left_eblks, blk_in_line);
	atomic_set(&line->left_seblks, blk_in_line);

	line->meta_distance = lm->meta_distance;
	spin_unlock(&line->lock);

	/* Bad blocks do not need to be erased */
	bitmap_copy(line->erase_bitmap, line->blk_bitmap, lm->blk_per_line);

	kref_init(&line->ref);

	return 0;
}

int pblk_line_recov_alloc(struct pblk *pblk, struct pblk_line *line)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	int ret;

	spin_lock(&l_mg->free_lock);
	l_mg->data_line = line;
	list_del(&line->list);

	ret = pblk_line_prepare(pblk, line);
	if (ret) {
		list_add(&line->list, &l_mg->free_list);
		spin_unlock(&l_mg->free_lock);
		return ret;
	}
	spin_unlock(&l_mg->free_lock);

	pblk_rl_free_lines_dec(&pblk->rl, line, true);

	if (!pblk_line_init_bb(pblk, line, 0)) {
		list_add(&line->list, &l_mg->free_list);
		return -EINTR;
	}

	return 0;
}

void pblk_line_recov_close(struct pblk *pblk, struct pblk_line *line)
{
	kfree(line->map_bitmap);
	line->map_bitmap = NULL;
	line->smeta = NULL;
	line->emeta = NULL;
}

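/* Take the next line off the free list and prepare it for use. Lines that
 * turn out to have no good blocks go to the bad list, corrupted ones to the
 * corrupt list, and the next free line is tried instead. Called with
 * l_mg->free_lock held.
 */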
struct pblk_line *pblk_line_get(struct pblk *pblk)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_line_meta *lm = &pblk->lm;
	struct pblk_line *line;
	int ret, bit;

	lockdep_assert_held(&l_mg->free_lock);

retry:
	if (list_empty(&l_mg->free_list)) {
		pr_err("pblk: no free lines\n");
		return NULL;
	}

	line = list_first_entry(&l_mg->free_list, struct pblk_line, list);
	list_del(&line->list);
	l_mg->nr_free_lines--;

	bit = find_first_zero_bit(line->blk_bitmap, lm->blk_per_line);
	if (unlikely(bit >= lm->blk_per_line)) {
		spin_lock(&line->lock);
		line->state = PBLK_LINESTATE_BAD;
		spin_unlock(&line->lock);

		list_add_tail(&line->list, &l_mg->bad_list);

		pr_debug("pblk: line %d is bad\n", line->id);
		goto retry;
	}

	ret = pblk_line_prepare(pblk, line);
	if (ret) {
		if (ret == -EAGAIN) {
			list_add(&line->list, &l_mg->corrupt_list);
			goto retry;
		} else {
			pr_err("pblk: failed to prepare line %d\n", line->id);
			list_add(&line->list, &l_mg->free_list);
			l_mg->nr_free_lines++;
			return NULL;
		}
	}

	return line;
}

static struct pblk_line *pblk_line_retry(struct pblk *pblk,
					 struct pblk_line *line)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_line *retry_line;

retry:
	spin_lock(&l_mg->free_lock);
	retry_line = pblk_line_get(pblk);
	if (!retry_line) {
		l_mg->data_line = NULL;
		spin_unlock(&l_mg->free_lock);
		return NULL;
	}

	retry_line->smeta = line->smeta;
	retry_line->emeta = line->emeta;
	retry_line->meta_line = line->meta_line;

	pblk_line_free(pblk, line);
	l_mg->data_line = retry_line;
	spin_unlock(&l_mg->free_lock);

	pblk_rl_free_lines_dec(&pblk->rl, line, false);

	if (pblk_line_erase(pblk, retry_line))
		goto retry;

	return retry_line;
}

static void pblk_set_space_limit(struct pblk *pblk)
{
	struct pblk_rl *rl = &pblk->rl;

	atomic_set(&rl->rb_space, 0);
}

struct pblk_line *pblk_line_get_first_data(struct pblk *pblk)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_line *line;

	spin_lock(&l_mg->free_lock);
	line = pblk_line_get(pblk);
	if (!line) {
		spin_unlock(&l_mg->free_lock);
		return NULL;
	}

	line->seq_nr = l_mg->d_seq_nr++;
	line->type = PBLK_LINETYPE_DATA;
	l_mg->data_line = line;

	pblk_line_setup_metadata(line, l_mg, &pblk->lm);

	/* Allocate next line for preparation */
	l_mg->data_next = pblk_line_get(pblk);
	if (!l_mg->data_next) {
		/* If we cannot get a new line, we need to stop the pipeline.
		 * Only allow as many writes in as we can store safely and then
		 * fail gracefully
		 */
		pblk_set_space_limit(pblk);

		l_mg->data_next = NULL;
	} else {
		l_mg->data_next->seq_nr = l_mg->d_seq_nr++;
		l_mg->data_next->type = PBLK_LINETYPE_DATA;
	}
	spin_unlock(&l_mg->free_lock);

	if (pblk_line_erase(pblk, line)) {
		line = pblk_line_retry(pblk, line);
		if (!line)
			return NULL;
	}

retry_setup:
	if (!pblk_line_init_metadata(pblk, line, NULL)) {
		line = pblk_line_retry(pblk, line);
		if (!line)
			return NULL;

		goto retry_setup;
	}

	if (!pblk_line_init_bb(pblk, line, 1)) {
		line = pblk_line_retry(pblk, line);
		if (!line)
			return NULL;

		goto retry_setup;
	}

	pblk_rl_free_lines_dec(&pblk->rl, line, true);

	return line;
}

static void pblk_stop_writes(struct pblk *pblk, struct pblk_line *line)
{
	lockdep_assert_held(&pblk->l_mg.free_lock);

	pblk_set_space_limit(pblk);
	pblk->state = PBLK_STATE_STOPPING;
}

static void pblk_line_close_meta_sync(struct pblk *pblk)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_line_meta *lm = &pblk->lm;
	struct pblk_line *line, *tline;
	LIST_HEAD(list);

	spin_lock(&l_mg->close_lock);
	if (list_empty(&l_mg->emeta_list)) {
		spin_unlock(&l_mg->close_lock);
		return;
	}

	list_cut_position(&list, &l_mg->emeta_list, l_mg->emeta_list.prev);
	spin_unlock(&l_mg->close_lock);

	list_for_each_entry_safe(line, tline, &list, list) {
		struct pblk_emeta *emeta = line->emeta;

		while (emeta->mem < lm->emeta_len[0]) {
			int ret;

			ret = pblk_submit_meta_io(pblk, line);
			if (ret) {
				pr_err("pblk: sync meta line %d failed (%d)\n",
							line->id, ret);
				return;
			}
		}
	}

	pblk_wait_for_meta(pblk);
	flush_workqueue(pblk->close_wq);
}

void pblk_pipeline_stop(struct pblk *pblk)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	int ret;

	spin_lock(&l_mg->free_lock);
	if (pblk->state == PBLK_STATE_RECOVERING ||
					pblk->state == PBLK_STATE_STOPPED) {
		spin_unlock(&l_mg->free_lock);
		return;
	}
	pblk->state = PBLK_STATE_RECOVERING;
	spin_unlock(&l_mg->free_lock);

	pblk_flush_writer(pblk);
	pblk_wait_for_meta(pblk);

	ret = pblk_recov_pad(pblk);
	if (ret) {
		pr_err("pblk: could not close data on teardown(%d)\n", ret);
		return;
	}

	flush_workqueue(pblk->bb_wq);
	pblk_line_close_meta_sync(pblk);

	spin_lock(&l_mg->free_lock);
	pblk->state = PBLK_STATE_STOPPED;
	l_mg->data_line = NULL;
	l_mg->data_next = NULL;
	spin_unlock(&l_mg->free_lock);
}

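/* Swap the current data line for the prepared next one: wait for outstanding
 * erases on the new line, set up its metadata and bitmaps, and allocate a
 * fresh data_next. If no free line is left, incoming writes are limited to
 * what the write buffer can safely hold before the pipeline is stopped.
 */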
struct pblk_line *pblk_line_replace_data(struct pblk *pblk)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_line *cur, *new = NULL;
	unsigned int left_seblks;

	cur = l_mg->data_line;
	new = l_mg->data_next;
	if (!new)
		goto out;
	l_mg->data_line = new;

	spin_lock(&l_mg->free_lock);
	pblk_line_setup_metadata(new, l_mg, &pblk->lm);
	spin_unlock(&l_mg->free_lock);

retry_erase:
	left_seblks = atomic_read(&new->left_seblks);
	if (left_seblks) {
		/* If line is not fully erased, erase it */
		if (atomic_read(&new->left_eblks)) {
			if (pblk_line_erase(pblk, new))
				goto out;
		} else {
			io_schedule();
		}
		goto retry_erase;
	}

retry_setup:
	if (!pblk_line_init_metadata(pblk, new, cur)) {
		new = pblk_line_retry(pblk, new);
		if (!new)
			goto out;

		goto retry_setup;
	}

	if (!pblk_line_init_bb(pblk, new, 1)) {
		new = pblk_line_retry(pblk, new);
		if (!new)
			goto out;

		goto retry_setup;
	}

	pblk_rl_free_lines_dec(&pblk->rl, new, true);

	/* Allocate next line for preparation */
	spin_lock(&l_mg->free_lock);
	l_mg->data_next = pblk_line_get(pblk);
	if (!l_mg->data_next) {
		/* If we cannot get a new line, we need to stop the pipeline.
		 * Only allow as many writes in as we can store safely and then
		 * fail gracefully
		 */
		pblk_stop_writes(pblk, new);
		l_mg->data_next = NULL;
	} else {
		l_mg->data_next->seq_nr = l_mg->d_seq_nr++;
		l_mg->data_next->type = PBLK_LINETYPE_DATA;
	}
	spin_unlock(&l_mg->free_lock);

out:
	return new;
}

void pblk_line_free(struct pblk *pblk, struct pblk_line *line)
{
	kfree(line->map_bitmap);
	kfree(line->invalid_bitmap);

	*line->vsc = cpu_to_le32(EMPTY_ENTRY);

	line->map_bitmap = NULL;
	line->invalid_bitmap = NULL;
	line->smeta = NULL;
	line->emeta = NULL;
}

a4bd217b 1476{
a4bd217b 1477 struct pblk_line_mgmt *l_mg = &pblk->l_mg;
d6b992f7 1478 struct pblk_gc *gc = &pblk->gc;
a4bd217b
JG
1479
1480 spin_lock(&line->lock);
1481 WARN_ON(line->state != PBLK_LINESTATE_GC);
1482 line->state = PBLK_LINESTATE_FREE;
1483 line->gc_group = PBLK_LINEGC_NONE;
1484 pblk_line_free(pblk, line);
1485 spin_unlock(&line->lock);
1486
d6b992f7
HH
1487 atomic_dec(&gc->pipeline_gc);
1488
a4bd217b
JG
1489 spin_lock(&l_mg->free_lock);
1490 list_add_tail(&line->list, &l_mg->free_list);
1491 l_mg->nr_free_lines++;
1492 spin_unlock(&l_mg->free_lock);
1493
1494 pblk_rl_free_lines_inc(&pblk->rl, line);
1495}
1496
7bd4d370
JG
1497static void pblk_line_put_ws(struct work_struct *work)
1498{
1499 struct pblk_line_ws *line_put_ws = container_of(work,
1500 struct pblk_line_ws, ws);
1501 struct pblk *pblk = line_put_ws->pblk;
1502 struct pblk_line *line = line_put_ws->line;
1503
1504 __pblk_line_put(pblk, line);
1505 mempool_free(line_put_ws, pblk->gen_ws_pool);
1506}
1507
1508void pblk_line_put(struct kref *ref)
1509{
1510 struct pblk_line *line = container_of(ref, struct pblk_line, ref);
1511 struct pblk *pblk = line->pblk;
1512
1513 __pblk_line_put(pblk, line);
1514}
1515
1516void pblk_line_put_wq(struct kref *ref)
1517{
1518 struct pblk_line *line = container_of(ref, struct pblk_line, ref);
1519 struct pblk *pblk = line->pblk;
1520 struct pblk_line_ws *line_put_ws;
1521
1522 line_put_ws = mempool_alloc(pblk->gen_ws_pool, GFP_ATOMIC);
1523 if (!line_put_ws)
1524 return;
1525
1526 line_put_ws->pblk = pblk;
1527 line_put_ws->line = line;
1528 line_put_ws->priv = NULL;
1529
1530 INIT_WORK(&line_put_ws->ws, pblk_line_put_ws);
1531 queue_work(pblk->r_end_wq, &line_put_ws->ws);
1532}
1533
int pblk_blk_erase_async(struct pblk *pblk, struct ppa_addr ppa)
{
	struct nvm_rq *rqd;
	int err;

	rqd = pblk_alloc_rqd(pblk, PBLK_ERASE);

	pblk_setup_e_rq(pblk, rqd, ppa);

	rqd->end_io = pblk_end_io_erase;
	rqd->private = pblk;

	/* The write thread schedules erases so that it minimizes disturbances
	 * with writes. Thus, there is no need to take the LUN semaphore.
	 */
	err = pblk_submit_io(pblk, rqd);
	if (err) {
		struct nvm_tgt_dev *dev = pblk->dev;
		struct nvm_geo *geo = &dev->geo;

		pr_err("pblk: could not async erase line:%d,blk:%d\n",
					pblk_ppa_to_line(ppa),
					pblk_ppa_to_pos(geo, ppa));
	}

	return err;
}

struct pblk_line *pblk_line_get_data(struct pblk *pblk)
{
	return pblk->l_mg.data_line;
}

/* For now, always erase next line */
struct pblk_line *pblk_line_get_erase(struct pblk *pblk)
{
	return pblk->l_mg.data_next;
}

int pblk_line_is_full(struct pblk_line *line)
{
	return (line->left_msecs == 0);
}

static void pblk_line_should_sync_meta(struct pblk *pblk)
{
	if (pblk_rl_is_limit(&pblk->rl))
		pblk_line_close_meta_sync(pblk);
}

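/* Close a fully mapped line: place it on the GC list matching its valid
 * sector count and drop its map bitmap and metadata buffer references.
 * pblk_line_close_meta() below queues the line so that its end metadata
 * (emeta) gets persisted.
 */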
void pblk_line_close(struct pblk *pblk, struct pblk_line *line)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct list_head *move_list;

#ifdef CONFIG_NVM_DEBUG
	struct pblk_line_meta *lm = &pblk->lm;

	WARN(!bitmap_full(line->map_bitmap, lm->sec_per_line),
				"pblk: corrupt closed line %d\n", line->id);
#endif

	spin_lock(&l_mg->free_lock);
	WARN_ON(!test_and_clear_bit(line->meta_line, &l_mg->meta_bitmap));
	spin_unlock(&l_mg->free_lock);

	spin_lock(&l_mg->gc_lock);
	spin_lock(&line->lock);
	WARN_ON(line->state != PBLK_LINESTATE_OPEN);
	line->state = PBLK_LINESTATE_CLOSED;
	move_list = pblk_line_gc_list(pblk, line);

	list_add_tail(&line->list, move_list);

	kfree(line->map_bitmap);
	line->map_bitmap = NULL;
	line->smeta = NULL;
	line->emeta = NULL;

	spin_unlock(&line->lock);
	spin_unlock(&l_mg->gc_lock);
}

void pblk_line_close_meta(struct pblk *pblk, struct pblk_line *line)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_line_meta *lm = &pblk->lm;
	struct pblk_emeta *emeta = line->emeta;
	struct line_emeta *emeta_buf = emeta->buf;
	struct wa_counters *wa = emeta_to_wa(lm, emeta_buf);

	/* No need for an exact vsc value; avoid a big line lock and take an
	 * approximation instead.
	 */
	memcpy(emeta_to_vsc(pblk, emeta_buf), l_mg->vsc_list, lm->vsc_list_len);
	memcpy(emeta_to_bb(emeta_buf), line->blk_bitmap, lm->blk_bitmap_len);

	wa->user = cpu_to_le64(atomic64_read(&pblk->user_wa));
	wa->pad = cpu_to_le64(atomic64_read(&pblk->pad_wa));
	wa->gc = cpu_to_le64(atomic64_read(&pblk->gc_wa));

	emeta_buf->nr_valid_lbas = cpu_to_le64(line->nr_valid_lbas);
	emeta_buf->crc = cpu_to_le32(pblk_calc_emeta_crc(pblk, emeta_buf));

	spin_lock(&l_mg->close_lock);
	spin_lock(&line->lock);
	list_add_tail(&line->list, &l_mg->emeta_list);
	spin_unlock(&line->lock);
	spin_unlock(&l_mg->close_lock);

	pblk_line_should_sync_meta(pblk);
}

void pblk_line_close_ws(struct work_struct *work)
{
	struct pblk_line_ws *line_ws = container_of(work, struct pblk_line_ws,
									ws);
	struct pblk *pblk = line_ws->pblk;
	struct pblk_line *line = line_ws->line;

	pblk_line_close(pblk, line);
	mempool_free(line_ws, pblk->gen_ws_pool);
}

void pblk_gen_run_ws(struct pblk *pblk, struct pblk_line *line, void *priv,
		     void (*work)(struct work_struct *), gfp_t gfp_mask,
		     struct workqueue_struct *wq)
{
	struct pblk_line_ws *line_ws;

	line_ws = mempool_alloc(pblk->gen_ws_pool, gfp_mask);

	line_ws->pblk = pblk;
	line_ws->line = line;
	line_ws->priv = priv;

	INIT_WORK(&line_ws->ws, work);
	queue_work(wq, &line_ws->ws);
}

static void __pblk_down_page(struct pblk *pblk, struct ppa_addr *ppa_list,
			     int nr_ppas, int pos)
{
	struct pblk_lun *rlun = &pblk->luns[pos];
	int ret;

	/*
	 * Only send one inflight I/O per LUN. Since we map at a page
	 * granularity, all ppas in the I/O will map to the same LUN
	 */
#ifdef CONFIG_NVM_DEBUG
	int i;

	for (i = 1; i < nr_ppas; i++)
		WARN_ON(ppa_list[0].g.lun != ppa_list[i].g.lun ||
				ppa_list[0].g.ch != ppa_list[i].g.ch);
#endif

	ret = down_timeout(&rlun->wr_sem, msecs_to_jiffies(30000));
	if (ret == -ETIME || ret == -EINTR)
		pr_err("pblk: taking lun semaphore timed out: err %d\n", -ret);
}

void pblk_down_page(struct pblk *pblk, struct ppa_addr *ppa_list, int nr_ppas)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	int pos = pblk_ppa_to_pos(geo, ppa_list[0]);

	__pblk_down_page(pblk, ppa_list, nr_ppas, pos);
}

void pblk_down_rq(struct pblk *pblk, struct ppa_addr *ppa_list, int nr_ppas,
		  unsigned long *lun_bitmap)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	int pos = pblk_ppa_to_pos(geo, ppa_list[0]);

	/* If the LUN has been locked for this same request, do not attempt
	 * to lock it again
	 */
	if (test_and_set_bit(pos, lun_bitmap))
		return;

	__pblk_down_page(pblk, ppa_list, nr_ppas, pos);
}

void pblk_up_page(struct pblk *pblk, struct ppa_addr *ppa_list, int nr_ppas)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct pblk_lun *rlun;
	int pos = pblk_ppa_to_pos(geo, ppa_list[0]);

#ifdef CONFIG_NVM_DEBUG
	int i;

	for (i = 1; i < nr_ppas; i++)
		WARN_ON(ppa_list[0].g.lun != ppa_list[i].g.lun ||
				ppa_list[0].g.ch != ppa_list[i].g.ch);
#endif

	rlun = &pblk->luns[pos];
	up(&rlun->wr_sem);
}

void pblk_up_rq(struct pblk *pblk, struct ppa_addr *ppa_list, int nr_ppas,
		unsigned long *lun_bitmap)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct pblk_lun *rlun;
	int nr_luns = geo->all_luns;
	int bit = -1;

	while ((bit = find_next_bit(lun_bitmap, nr_luns, bit + 1)) < nr_luns) {
		rlun = &pblk->luns[bit];
		up(&rlun->wr_sem);
	}
}

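/* L2P update helpers. The map is only modified under pblk->trans_lock, and
 * an entry that currently points to a device address must be invalidated on
 * its line before being remapped.
 */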
void pblk_update_map(struct pblk *pblk, sector_t lba, struct ppa_addr ppa)
{
	struct ppa_addr ppa_l2p;

	/* logic error: lba out-of-bounds. Ignore update */
	if (!(lba < pblk->rl.nr_secs)) {
		WARN(1, "pblk: corrupted L2P map request\n");
		return;
	}

	spin_lock(&pblk->trans_lock);
	ppa_l2p = pblk_trans_map_get(pblk, lba);

	if (!pblk_addr_in_cache(ppa_l2p) && !pblk_ppa_empty(ppa_l2p))
		pblk_map_invalidate(pblk, ppa_l2p);

	pblk_trans_map_set(pblk, lba, ppa);
	spin_unlock(&pblk->trans_lock);
}

void pblk_update_map_cache(struct pblk *pblk, sector_t lba, struct ppa_addr ppa)
{
#ifdef CONFIG_NVM_DEBUG
	/* Callers must ensure that the ppa points to a cache address */
	BUG_ON(!pblk_addr_in_cache(ppa));
	BUG_ON(pblk_rb_pos_oob(&pblk->rwb, pblk_addr_to_cacheline(ppa)));
#endif

	pblk_update_map(pblk, lba, ppa);
}

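/* GC path: install the relocated entry only if the L2P still points to the
 * physical sector that GC read from. If the entry changed in the meantime,
 * the host overwrote the data and the GC copy must be dropped.
 */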
int pblk_update_map_gc(struct pblk *pblk, sector_t lba, struct ppa_addr ppa_new,
		       struct pblk_line *gc_line, u64 paddr_gc)
{
	struct ppa_addr ppa_l2p, ppa_gc;
	int ret = 1;

#ifdef CONFIG_NVM_DEBUG
	/* Callers must ensure that the ppa points to a cache address */
	BUG_ON(!pblk_addr_in_cache(ppa_new));
	BUG_ON(pblk_rb_pos_oob(&pblk->rwb, pblk_addr_to_cacheline(ppa_new)));
#endif

	/* logic error: lba out-of-bounds. Ignore update */
	if (!(lba < pblk->rl.nr_secs)) {
		WARN(1, "pblk: corrupted L2P map request\n");
		return 0;
	}

	spin_lock(&pblk->trans_lock);
	ppa_l2p = pblk_trans_map_get(pblk, lba);
	ppa_gc = addr_to_gen_ppa(pblk, paddr_gc, gc_line->id);

	if (!pblk_ppa_comp(ppa_l2p, ppa_gc)) {
		spin_lock(&gc_line->lock);
		WARN(!test_bit(paddr_gc, gc_line->invalid_bitmap),
						"pblk: corrupted GC update");
		spin_unlock(&gc_line->lock);

		ret = 0;
		goto out;
	}

	pblk_trans_map_set(pblk, lba, ppa_new);
out:
	spin_unlock(&pblk->trans_lock);
	return ret;
}

void pblk_update_map_dev(struct pblk *pblk, sector_t lba,
			 struct ppa_addr ppa_mapped, struct ppa_addr ppa_cache)
{
	struct ppa_addr ppa_l2p;

#ifdef CONFIG_NVM_DEBUG
	/* Callers must ensure that the ppa points to a device address */
	BUG_ON(pblk_addr_in_cache(ppa_mapped));
#endif
	/* Invalidate and discard padded entries */
	if (lba == ADDR_EMPTY) {
		atomic64_inc(&pblk->pad_wa);
#ifdef CONFIG_NVM_DEBUG
		atomic_long_inc(&pblk->padded_wb);
#endif
		if (!pblk_ppa_empty(ppa_mapped))
			pblk_map_invalidate(pblk, ppa_mapped);
		return;
	}

	/* logic error: lba out-of-bounds. Ignore update */
	if (!(lba < pblk->rl.nr_secs)) {
		WARN(1, "pblk: corrupted L2P map request\n");
		return;
	}

	spin_lock(&pblk->trans_lock);
	ppa_l2p = pblk_trans_map_get(pblk, lba);

	/* Do not update L2P if the cacheline has been updated. In this case,
	 * the mapped ppa must be invalidated
	 */
	if (!pblk_ppa_comp(ppa_l2p, ppa_cache)) {
		if (!pblk_ppa_empty(ppa_mapped))
			pblk_map_invalidate(pblk, ppa_mapped);
		goto out;
	}

#ifdef CONFIG_NVM_DEBUG
	WARN_ON(!pblk_addr_in_cache(ppa_l2p) && !pblk_ppa_empty(ppa_l2p));
#endif

	pblk_trans_map_set(pblk, lba, ppa_mapped);
out:
	spin_unlock(&pblk->trans_lock);
}

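/* Batched L2P lookups under a single trans_lock acquisition. The sequential
 * variant also takes a reference on every line it returns a device address
 * for, so those lines cannot be recycled while the read is in flight.
 */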
void pblk_lookup_l2p_seq(struct pblk *pblk, struct ppa_addr *ppas,
			 sector_t blba, int nr_secs)
{
	int i;

	spin_lock(&pblk->trans_lock);
	for (i = 0; i < nr_secs; i++) {
		struct ppa_addr ppa;

		ppa = ppas[i] = pblk_trans_map_get(pblk, blba + i);

		/* If the L2P entry maps to a line, the reference is valid */
		if (!pblk_ppa_empty(ppa) && !pblk_addr_in_cache(ppa)) {
			int line_id = pblk_ppa_to_line(ppa);
			struct pblk_line *line = &pblk->lines[line_id];

			kref_get(&line->ref);
		}
	}
	spin_unlock(&pblk->trans_lock);
}

void pblk_lookup_l2p_rand(struct pblk *pblk, struct ppa_addr *ppas,
			  u64 *lba_list, int nr_secs)
{
	u64 lba;
	int i;

	spin_lock(&pblk->trans_lock);
	for (i = 0; i < nr_secs; i++) {
		lba = lba_list[i];
		if (lba != ADDR_EMPTY) {
			/* logic error: lba out-of-bounds. Ignore update */
			if (!(lba < pblk->rl.nr_secs)) {
				WARN(1, "pblk: corrupted L2P map request\n");
				continue;
			}
			ppas[i] = pblk_trans_map_get(pblk, lba);
		}
	}
	spin_unlock(&pblk->trans_lock);
}