lightnvm: convert to bioset_init()/mempool_init()
[linux-2.6-block.git] / drivers / lightnvm / pblk-core.c
/*
 * Copyright (C) 2016 CNEX Labs
 * Initial release: Javier Gonzalez <javier@cnexlabs.com>
 *                  Matias Bjorling <matias@cnexlabs.com>
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License version
 * 2 as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * pblk-core.c - pblk's core functionality
 *
 */

#include "pblk.h"

static void pblk_line_mark_bb(struct work_struct *work)
{
	struct pblk_line_ws *line_ws = container_of(work, struct pblk_line_ws,
									ws);
	struct pblk *pblk = line_ws->pblk;
	struct nvm_tgt_dev *dev = pblk->dev;
	struct ppa_addr *ppa = line_ws->priv;
	int ret;

	ret = nvm_set_tgt_bb_tbl(dev, ppa, 1, NVM_BLK_T_GRWN_BAD);
	if (ret) {
		struct pblk_line *line;
		int pos;

		line = &pblk->lines[pblk_ppa_to_line(*ppa)];
		pos = pblk_ppa_to_pos(&dev->geo, *ppa);

		pr_err("pblk: failed to mark bb, line:%d, pos:%d\n",
				line->id, pos);
	}

	kfree(ppa);
	mempool_free(line_ws, &pblk->gen_ws_pool);
}

static void pblk_mark_bb(struct pblk *pblk, struct pblk_line *line,
			 struct ppa_addr ppa_addr)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct ppa_addr *ppa;
	int pos = pblk_ppa_to_pos(geo, ppa_addr);

	pr_debug("pblk: erase failed: line:%d, pos:%d\n", line->id, pos);
	atomic_long_inc(&pblk->erase_failed);

	atomic_dec(&line->blk_in_line);
	if (test_and_set_bit(pos, line->blk_bitmap))
		pr_err("pblk: attempted to erase bb: line:%d, pos:%d\n",
							line->id, pos);

	/* Not necessary to mark bad blocks on 2.0 spec. */
	if (geo->version == NVM_OCSSD_SPEC_20)
		return;

	ppa = kmalloc(sizeof(struct ppa_addr), GFP_ATOMIC);
	if (!ppa)
		return;

	*ppa = ppa_addr;
	pblk_gen_run_ws(pblk, NULL, ppa, pblk_line_mark_bb,
						GFP_ATOMIC, pblk->bb_wq);
}

static void __pblk_end_io_erase(struct pblk *pblk, struct nvm_rq *rqd)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct nvm_chk_meta *chunk;
	struct pblk_line *line;
	int pos;

	line = &pblk->lines[pblk_ppa_to_line(rqd->ppa_addr)];
	pos = pblk_ppa_to_pos(geo, rqd->ppa_addr);
	chunk = &line->chks[pos];

	atomic_dec(&line->left_seblks);

	if (rqd->error) {
		chunk->state = NVM_CHK_ST_OFFLINE;
		pblk_mark_bb(pblk, line, rqd->ppa_addr);
	} else {
		chunk->state = NVM_CHK_ST_FREE;
	}

	atomic_dec(&pblk->inflight_io);
}

/* Erase completion assumes that only one block is erased at a time */
static void pblk_end_io_erase(struct nvm_rq *rqd)
{
	struct pblk *pblk = rqd->private;

	__pblk_end_io_erase(pblk, rqd);
	mempool_free(rqd, &pblk->e_rq_pool);
}

/*
 * Get information for all chunks from the device.
 *
 * The caller is responsible for freeing the returned structure
 */
struct nvm_chk_meta *pblk_chunk_get_info(struct pblk *pblk)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct nvm_chk_meta *meta;
	struct ppa_addr ppa;
	unsigned long len;
	int ret;

	ppa.ppa = 0;

	len = geo->all_chunks * sizeof(*meta);
	meta = kzalloc(len, GFP_KERNEL);
	if (!meta)
		return ERR_PTR(-ENOMEM);

	ret = nvm_get_chunk_meta(dev, meta, ppa, geo->all_chunks);
	if (ret) {
		kfree(meta);
		return ERR_PTR(-EIO);
	}

	return meta;
}

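/*
 * The flat chunk metadata array returned above is laid out group-major:
 * all chunks of a parallel unit are contiguous, and all parallel units
 * of a group follow each other. The offsets below index into that array
 * (e.g. grp=1, pu=2, chk=3 with num_lun=4 and num_chk=1020 lands at
 * 1 * 1020 * 4 + 2 * 1020 + 3; the geometry values are just examples).
 */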
struct nvm_chk_meta *pblk_chunk_get_off(struct pblk *pblk,
					struct nvm_chk_meta *meta,
					struct ppa_addr ppa)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	int ch_off = ppa.m.grp * geo->num_chk * geo->num_lun;
	int lun_off = ppa.m.pu * geo->num_chk;
	int chk_off = ppa.m.chk;

	return meta + ch_off + lun_off + chk_off;
}

void __pblk_map_invalidate(struct pblk *pblk, struct pblk_line *line,
			   u64 paddr)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct list_head *move_list = NULL;

	/* Lines being reclaimed (GC'ed) cannot be invalidated. Before the L2P
	 * table is modified with reclaimed sectors, a check is done to ensure
	 * that newer updates are not overwritten.
	 */
	spin_lock(&line->lock);
	WARN_ON(line->state == PBLK_LINESTATE_FREE);

	if (test_and_set_bit(paddr, line->invalid_bitmap)) {
		WARN_ONCE(1, "pblk: double invalidate\n");
		spin_unlock(&line->lock);
		return;
	}
	le32_add_cpu(line->vsc, -1);

	if (line->state == PBLK_LINESTATE_CLOSED)
		move_list = pblk_line_gc_list(pblk, line);
	spin_unlock(&line->lock);

	if (move_list) {
		spin_lock(&l_mg->gc_lock);
		spin_lock(&line->lock);
		/* Prevent moving a line that has just been chosen for GC */
		if (line->state == PBLK_LINESTATE_GC) {
			spin_unlock(&line->lock);
			spin_unlock(&l_mg->gc_lock);
			return;
		}
		spin_unlock(&line->lock);

		list_move_tail(&line->list, move_list);
		spin_unlock(&l_mg->gc_lock);
	}
}

void pblk_map_invalidate(struct pblk *pblk, struct ppa_addr ppa)
{
	struct pblk_line *line;
	u64 paddr;
	int line_id;

#ifdef CONFIG_NVM_DEBUG
	/* Callers must ensure that the ppa points to a device address */
	BUG_ON(pblk_addr_in_cache(ppa));
	BUG_ON(pblk_ppa_empty(ppa));
#endif

	line_id = pblk_ppa_to_line(ppa);
	line = &pblk->lines[line_id];
	paddr = pblk_dev_ppa_to_line_addr(pblk, ppa);

	__pblk_map_invalidate(pblk, line, paddr);
}

static void pblk_invalidate_range(struct pblk *pblk, sector_t slba,
				  unsigned int nr_secs)
{
	sector_t lba;

	spin_lock(&pblk->trans_lock);
	for (lba = slba; lba < slba + nr_secs; lba++) {
		struct ppa_addr ppa;

		ppa = pblk_trans_map_get(pblk, lba);

		if (!pblk_addr_in_cache(ppa) && !pblk_ppa_empty(ppa))
			pblk_map_invalidate(pblk, ppa);

		pblk_ppa_set_empty(&ppa);
		pblk_trans_map_set(pblk, lba, ppa);
	}
	spin_unlock(&pblk->trans_lock);
}

/* Caller must guarantee that the request is a valid type */
struct nvm_rq *pblk_alloc_rqd(struct pblk *pblk, int type)
{
	mempool_t *pool;
	struct nvm_rq *rqd;
	int rq_size;

	switch (type) {
	case PBLK_WRITE:
	case PBLK_WRITE_INT:
		pool = &pblk->w_rq_pool;
		rq_size = pblk_w_rq_size;
		break;
	case PBLK_READ:
		pool = &pblk->r_rq_pool;
		rq_size = pblk_g_rq_size;
		break;
	default:
		pool = &pblk->e_rq_pool;
		rq_size = pblk_g_rq_size;
	}

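	/* mempool_alloc() with GFP_KERNEL waits for an element to be
	 * returned to the pool rather than failing, so no NULL check
	 * is needed here.
	 */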
	rqd = mempool_alloc(pool, GFP_KERNEL);
	memset(rqd, 0, rq_size);

	return rqd;
}

/* Typically used on completion path. Cannot guarantee request consistency */
void pblk_free_rqd(struct pblk *pblk, struct nvm_rq *rqd, int type)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	mempool_t *pool;

	switch (type) {
	case PBLK_WRITE:
		kfree(((struct pblk_c_ctx *)nvm_rq_to_pdu(rqd))->lun_bitmap);
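		/* fall through: internal writes share the write rqd pool */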
	case PBLK_WRITE_INT:
		pool = &pblk->w_rq_pool;
		break;
	case PBLK_READ:
		pool = &pblk->r_rq_pool;
		break;
	case PBLK_ERASE:
		pool = &pblk->e_rq_pool;
		break;
	default:
		pr_err("pblk: trying to free unknown rqd type\n");
		return;
	}

	nvm_dev_dma_free(dev->parent, rqd->meta_list, rqd->dma_meta_list);
	mempool_free(rqd, pool);
}

void pblk_bio_free_pages(struct pblk *pblk, struct bio *bio, int off,
			 int nr_pages)
{
	struct bio_vec bv;
	int i;

	WARN_ON(off + nr_pages != bio->bi_vcnt);

	for (i = off; i < nr_pages + off; i++) {
		bv = bio->bi_io_vec[i];
		mempool_free(bv.bv_page, &pblk->page_bio_pool);
	}
}

int pblk_bio_add_pages(struct pblk *pblk, struct bio *bio, gfp_t flags,
		       int nr_pages)
{
	struct request_queue *q = pblk->dev->q;
	struct page *page;
	int i, ret;

	for (i = 0; i < nr_pages; i++) {
		page = mempool_alloc(&pblk->page_bio_pool, flags);

		ret = bio_add_pc_page(q, bio, page, PBLK_EXPOSED_PAGE_SIZE, 0);
		if (ret != PBLK_EXPOSED_PAGE_SIZE) {
			pr_err("pblk: could not add page to bio\n");
			mempool_free(page, &pblk->page_bio_pool);
			goto err;
		}
	}

	return 0;
err:
	pblk_bio_free_pages(pblk, bio, 0, i);
	return -1;
}

static void pblk_write_kick(struct pblk *pblk)
{
	wake_up_process(pblk->writer_ts);
	mod_timer(&pblk->wtimer, jiffies + msecs_to_jiffies(1000));
}

void pblk_write_timer_fn(struct timer_list *t)
{
	struct pblk *pblk = from_timer(pblk, t, wtimer);

	/* kick the write thread every tick to flush outstanding data */
	pblk_write_kick(pblk);
}

void pblk_write_should_kick(struct pblk *pblk)
{
	unsigned int secs_avail = pblk_rb_read_count(&pblk->rwb);

	if (secs_avail >= pblk->min_write_pgs)
		pblk_write_kick(pblk);
}

void pblk_end_io_sync(struct nvm_rq *rqd)
{
	struct completion *waiting = rqd->private;

	complete(waiting);
}

static void pblk_wait_for_meta(struct pblk *pblk)
{
	do {
		if (!atomic_read(&pblk->inflight_io))
			break;

		schedule();
	} while (1);
}

static void pblk_flush_writer(struct pblk *pblk)
{
	pblk_rb_flush(&pblk->rwb);
	do {
		if (!pblk_rb_sync_count(&pblk->rwb))
			break;

		pblk_write_kick(pblk);
		schedule();
	} while (1);
}

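/*
 * Pick the GC list a line belongs to from its valid sector count (vsc):
 * 0 -> full, below high_thrs -> high, below mid_thrs -> mid, below
 * sec_in_line -> low, exactly sec_in_line -> empty. Anything larger
 * indicates a corrupted count.
 */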
struct list_head *pblk_line_gc_list(struct pblk *pblk, struct pblk_line *line)
{
	struct pblk_line_meta *lm = &pblk->lm;
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct list_head *move_list = NULL;
	int vsc = le32_to_cpu(*line->vsc);

	lockdep_assert_held(&line->lock);

	if (!vsc) {
		if (line->gc_group != PBLK_LINEGC_FULL) {
			line->gc_group = PBLK_LINEGC_FULL;
			move_list = &l_mg->gc_full_list;
		}
	} else if (vsc < lm->high_thrs) {
		if (line->gc_group != PBLK_LINEGC_HIGH) {
			line->gc_group = PBLK_LINEGC_HIGH;
			move_list = &l_mg->gc_high_list;
		}
	} else if (vsc < lm->mid_thrs) {
		if (line->gc_group != PBLK_LINEGC_MID) {
			line->gc_group = PBLK_LINEGC_MID;
			move_list = &l_mg->gc_mid_list;
		}
	} else if (vsc < line->sec_in_line) {
		if (line->gc_group != PBLK_LINEGC_LOW) {
			line->gc_group = PBLK_LINEGC_LOW;
			move_list = &l_mg->gc_low_list;
		}
	} else if (vsc == line->sec_in_line) {
		if (line->gc_group != PBLK_LINEGC_EMPTY) {
			line->gc_group = PBLK_LINEGC_EMPTY;
			move_list = &l_mg->gc_empty_list;
		}
	} else {
		line->state = PBLK_LINESTATE_CORRUPT;
		line->gc_group = PBLK_LINEGC_NONE;
		move_list = &l_mg->corrupt_list;
		pr_err("pblk: corrupted vsc for line %d, vsc:%d (%d/%d/%d)\n",
						line->id, vsc,
						line->sec_in_line,
						lm->high_thrs, lm->mid_thrs);
	}

	return move_list;
}

void pblk_discard(struct pblk *pblk, struct bio *bio)
{
	sector_t slba = pblk_get_lba(bio);
	sector_t nr_secs = pblk_get_secs(bio);

	pblk_invalidate_range(pblk, slba, nr_secs);
}

void pblk_log_write_err(struct pblk *pblk, struct nvm_rq *rqd)
{
	atomic_long_inc(&pblk->write_failed);
#ifdef CONFIG_NVM_DEBUG
	pblk_print_failed_rqd(pblk, rqd, rqd->error);
#endif
}

void pblk_log_read_err(struct pblk *pblk, struct nvm_rq *rqd)
{
	/* Empty page read is not necessarily an error (e.g., L2P recovery) */
	if (rqd->error == NVM_RSP_ERR_EMPTYPAGE) {
		atomic_long_inc(&pblk->read_empty);
		return;
	}

	switch (rqd->error) {
	case NVM_RSP_WARN_HIGHECC:
		atomic_long_inc(&pblk->read_high_ecc);
		break;
	case NVM_RSP_ERR_FAILECC:
	case NVM_RSP_ERR_FAILCRC:
		atomic_long_inc(&pblk->read_failed);
		break;
	default:
		pr_err("pblk: unknown read error:%d\n", rqd->error);
	}
#ifdef CONFIG_NVM_DEBUG
	pblk_print_failed_rqd(pblk, rqd, rqd->error);
#endif
}

void pblk_set_sec_per_write(struct pblk *pblk, int sec_per_write)
{
	pblk->sec_per_write = sec_per_write;
}

int pblk_submit_io(struct pblk *pblk, struct nvm_rq *rqd)
{
	struct nvm_tgt_dev *dev = pblk->dev;

#ifdef CONFIG_NVM_DEBUG
	int ret;

	ret = pblk_check_io(pblk, rqd);
	if (ret)
		return ret;
#endif

	atomic_inc(&pblk->inflight_io);

	return nvm_submit_io(dev, rqd);
}

int pblk_submit_io_sync(struct pblk *pblk, struct nvm_rq *rqd)
{
	struct nvm_tgt_dev *dev = pblk->dev;

#ifdef CONFIG_NVM_DEBUG
	int ret;

	ret = pblk_check_io(pblk, rqd);
	if (ret)
		return ret;
#endif

	atomic_inc(&pblk->inflight_io);

	return nvm_submit_io_sync(dev, rqd);
}

static void pblk_bio_map_addr_endio(struct bio *bio)
{
	bio_put(bio);
}

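/*
 * Map a metadata buffer into a bio. Buffers allocated with kmalloc are
 * physically contiguous and can be mapped in one go with bio_map_kern();
 * vmalloc'ed buffers are only virtually contiguous, so each page has to
 * be looked up with vmalloc_to_page() and added individually.
 */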
struct bio *pblk_bio_map_addr(struct pblk *pblk, void *data,
			      unsigned int nr_secs, unsigned int len,
			      int alloc_type, gfp_t gfp_mask)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	void *kaddr = data;
	struct page *page;
	struct bio *bio;
	int i, ret;

	if (alloc_type == PBLK_KMALLOC_META)
		return bio_map_kern(dev->q, kaddr, len, gfp_mask);

	bio = bio_kmalloc(gfp_mask, nr_secs);
	if (!bio)
		return ERR_PTR(-ENOMEM);

	for (i = 0; i < nr_secs; i++) {
		page = vmalloc_to_page(kaddr);
		if (!page) {
			pr_err("pblk: could not map vmalloc bio\n");
			bio_put(bio);
			bio = ERR_PTR(-ENOMEM);
			goto out;
		}

		ret = bio_add_pc_page(dev->q, bio, page, PAGE_SIZE, 0);
		if (ret != PAGE_SIZE) {
			pr_err("pblk: could not add page to bio\n");
			bio_put(bio);
			bio = ERR_PTR(-ENOMEM);
			goto out;
		}

		kaddr += PAGE_SIZE;
	}

	bio->bi_end_io = pblk_bio_map_addr_endio;
out:
	return bio;
}

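/*
 * Decide how many sectors to write as one I/O: everything up to the
 * maximum when enough data is buffered, otherwise the largest multiple
 * of the minimal write size, and the bare minimum only on a flush.
 * E.g. with min = 8 and max = 64, 21 available sectors yield 16.
 */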
int pblk_calc_secs(struct pblk *pblk, unsigned long secs_avail,
		   unsigned long secs_to_flush)
{
	int max = pblk->sec_per_write;
	int min = pblk->min_write_pgs;
	int secs_to_sync = 0;

	if (secs_avail >= max)
		secs_to_sync = max;
	else if (secs_avail >= min)
		secs_to_sync = min * (secs_avail / min);
	else if (secs_to_flush)
		secs_to_sync = min;

	return secs_to_sync;
}

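/*
 * Roll back the last nr_secs sector allocations on a line: clear their
 * bits in the map bitmap and rewind cur_sec accordingly.
 */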
void pblk_dealloc_page(struct pblk *pblk, struct pblk_line *line, int nr_secs)
{
	u64 addr;
	int i;

	spin_lock(&line->lock);
	addr = find_next_zero_bit(line->map_bitmap,
					pblk->lm.sec_per_line, line->cur_sec);
	line->cur_sec = addr - nr_secs;

	for (i = 0; i < nr_secs; i++, line->cur_sec--)
		WARN_ON(!test_and_clear_bit(line->cur_sec, line->map_bitmap));
	spin_unlock(&line->lock);
}

u64 __pblk_alloc_page(struct pblk *pblk, struct pblk_line *line, int nr_secs)
{
	u64 addr;
	int i;

	lockdep_assert_held(&line->lock);

	/* logic error: ppa out-of-bounds. Prevent generating bad address */
	if (line->cur_sec + nr_secs > pblk->lm.sec_per_line) {
		WARN(1, "pblk: page allocation out of bounds\n");
		nr_secs = pblk->lm.sec_per_line - line->cur_sec;
	}

	line->cur_sec = addr = find_next_zero_bit(line->map_bitmap,
					pblk->lm.sec_per_line, line->cur_sec);
	for (i = 0; i < nr_secs; i++, line->cur_sec++)
		WARN_ON(test_and_set_bit(line->cur_sec, line->map_bitmap));

	return addr;
}

u64 pblk_alloc_page(struct pblk *pblk, struct pblk_line *line, int nr_secs)
{
	u64 addr;

	/* Lock needed in case a write fails and a recovery needs to remap
	 * failed write buffer entries
	 */
	spin_lock(&line->lock);
	addr = __pblk_alloc_page(pblk, line, nr_secs);
	line->left_msecs -= nr_secs;
	WARN(line->left_msecs < 0, "pblk: page allocation out of bounds\n");
	spin_unlock(&line->lock);

	return addr;
}

u64 pblk_lookup_page(struct pblk *pblk, struct pblk_line *line)
{
	u64 paddr;

	spin_lock(&line->lock);
	paddr = find_next_zero_bit(line->map_bitmap,
					pblk->lm.sec_per_line, line->cur_sec);
	spin_unlock(&line->lock);

	return paddr;
}

/*
 * Submit emeta to one LUN in the raid line at a time to avoid a deadlock when
 * taking the per LUN semaphore.
 */
static int pblk_line_submit_emeta_io(struct pblk *pblk, struct pblk_line *line,
				     void *emeta_buf, u64 paddr, int dir)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_line_meta *lm = &pblk->lm;
	void *ppa_list, *meta_list;
	struct bio *bio;
	struct nvm_rq rqd;
	dma_addr_t dma_ppa_list, dma_meta_list;
	int min = pblk->min_write_pgs;
	int left_ppas = lm->emeta_sec[0];
	int id = line->id;
	int rq_ppas, rq_len;
	int cmd_op, bio_op;
	int i, j;
	int ret;

	if (dir == PBLK_WRITE) {
		bio_op = REQ_OP_WRITE;
		cmd_op = NVM_OP_PWRITE;
	} else if (dir == PBLK_READ) {
		bio_op = REQ_OP_READ;
		cmd_op = NVM_OP_PREAD;
	} else
		return -EINVAL;

	meta_list = nvm_dev_dma_alloc(dev->parent, GFP_KERNEL,
							&dma_meta_list);
	if (!meta_list)
		return -ENOMEM;

	ppa_list = meta_list + pblk_dma_meta_size;
	dma_ppa_list = dma_meta_list + pblk_dma_meta_size;

next_rq:
	memset(&rqd, 0, sizeof(struct nvm_rq));

	rq_ppas = pblk_calc_secs(pblk, left_ppas, 0);
	rq_len = rq_ppas * geo->csecs;

	bio = pblk_bio_map_addr(pblk, emeta_buf, rq_ppas, rq_len,
					l_mg->emeta_alloc_type, GFP_KERNEL);
	if (IS_ERR(bio)) {
		ret = PTR_ERR(bio);
		goto free_rqd_dma;
	}

	bio->bi_iter.bi_sector = 0; /* internal bio */
	bio_set_op_attrs(bio, bio_op, 0);

	rqd.bio = bio;
	rqd.meta_list = meta_list;
	rqd.ppa_list = ppa_list;
	rqd.dma_meta_list = dma_meta_list;
	rqd.dma_ppa_list = dma_ppa_list;
	rqd.opcode = cmd_op;
	rqd.nr_ppas = rq_ppas;

	if (dir == PBLK_WRITE) {
		struct pblk_sec_meta *meta_list = rqd.meta_list;

		rqd.flags = pblk_set_progr_mode(pblk, PBLK_WRITE);
		for (i = 0; i < rqd.nr_ppas; ) {
			spin_lock(&line->lock);
			paddr = __pblk_alloc_page(pblk, line, min);
			spin_unlock(&line->lock);
			for (j = 0; j < min; j++, i++, paddr++) {
				meta_list[i].lba = cpu_to_le64(ADDR_EMPTY);
				rqd.ppa_list[i] =
					addr_to_gen_ppa(pblk, paddr, id);
			}
		}
	} else {
		for (i = 0; i < rqd.nr_ppas; ) {
			struct ppa_addr ppa = addr_to_gen_ppa(pblk, paddr, id);
			int pos = pblk_ppa_to_pos(geo, ppa);
			int read_type = PBLK_READ_RANDOM;

			if (pblk_io_aligned(pblk, rq_ppas))
				read_type = PBLK_READ_SEQUENTIAL;
			rqd.flags = pblk_set_read_mode(pblk, read_type);

			while (test_bit(pos, line->blk_bitmap)) {
				paddr += min;
				if (pblk_boundary_paddr_checks(pblk, paddr)) {
					pr_err("pblk: corrupt emeta line:%d\n",
								line->id);
					bio_put(bio);
					ret = -EINTR;
					goto free_rqd_dma;
				}

				ppa = addr_to_gen_ppa(pblk, paddr, id);
				pos = pblk_ppa_to_pos(geo, ppa);
			}

			if (pblk_boundary_paddr_checks(pblk, paddr + min)) {
				pr_err("pblk: corrupt emeta line:%d\n",
								line->id);
				bio_put(bio);
				ret = -EINTR;
				goto free_rqd_dma;
			}

			for (j = 0; j < min; j++, i++, paddr++)
				rqd.ppa_list[i] =
					addr_to_gen_ppa(pblk, paddr, line->id);
		}
	}

	ret = pblk_submit_io_sync(pblk, &rqd);
	if (ret) {
		pr_err("pblk: emeta I/O submission failed: %d\n", ret);
		bio_put(bio);
		goto free_rqd_dma;
	}

	atomic_dec(&pblk->inflight_io);

	if (rqd.error) {
		if (dir == PBLK_WRITE)
			pblk_log_write_err(pblk, &rqd);
		else
			pblk_log_read_err(pblk, &rqd);
	}

	emeta_buf += rq_len;
	left_ppas -= rq_ppas;
	if (left_ppas)
		goto next_rq;
free_rqd_dma:
	nvm_dev_dma_free(dev->parent, rqd.meta_list, rqd.dma_meta_list);
	return ret;
}

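/*
 * smeta lives at the start of the first good block of the line; line
 * addresses advance in ws_opt-sized strides per block, so the start
 * address is simply that block's index times ws_opt.
 */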
u64 pblk_line_smeta_start(struct pblk *pblk, struct pblk_line *line)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct pblk_line_meta *lm = &pblk->lm;
	int bit;

	/* This usually only happens on bad lines */
	bit = find_first_zero_bit(line->blk_bitmap, lm->blk_per_line);
	if (bit >= lm->blk_per_line)
		return -1;

	return bit * geo->ws_opt;
}

783
784static int pblk_line_submit_smeta_io(struct pblk *pblk, struct pblk_line *line,
785 u64 paddr, int dir)
786{
787 struct nvm_tgt_dev *dev = pblk->dev;
788 struct pblk_line_meta *lm = &pblk->lm;
789 struct bio *bio;
790 struct nvm_rq rqd;
791 __le64 *lba_list = NULL;
792 int i, ret;
793 int cmd_op, bio_op;
794 int flags;
a4bd217b 795
e2cddf20 796 if (dir == PBLK_WRITE) {
a4bd217b
JG
797 bio_op = REQ_OP_WRITE;
798 cmd_op = NVM_OP_PWRITE;
e2cddf20 799 flags = pblk_set_progr_mode(pblk, PBLK_WRITE);
dd2a4343 800 lba_list = emeta_to_lbas(pblk, line->emeta->buf);
8f554597 801 } else if (dir == PBLK_READ_RECOV || dir == PBLK_READ) {
a4bd217b
JG
802 bio_op = REQ_OP_READ;
803 cmd_op = NVM_OP_PREAD;
f9c10152 804 flags = pblk_set_read_mode(pblk, PBLK_READ_SEQUENTIAL);
a4bd217b
JG
805 } else
806 return -EINVAL;
807
808 memset(&rqd, 0, sizeof(struct nvm_rq));
809
63e3809c
JG
810 rqd.meta_list = nvm_dev_dma_alloc(dev->parent, GFP_KERNEL,
811 &rqd.dma_meta_list);
812 if (!rqd.meta_list)
a4bd217b
JG
813 return -ENOMEM;
814
63e3809c
JG
815 rqd.ppa_list = rqd.meta_list + pblk_dma_meta_size;
816 rqd.dma_ppa_list = rqd.dma_meta_list + pblk_dma_meta_size;
817
a4bd217b
JG
818 bio = bio_map_kern(dev->q, line->smeta, lm->smeta_len, GFP_KERNEL);
819 if (IS_ERR(bio)) {
820 ret = PTR_ERR(bio);
821 goto free_ppa_list;
822 }
823
824 bio->bi_iter.bi_sector = 0; /* internal bio */
825 bio_set_op_attrs(bio, bio_op, 0);
826
827 rqd.bio = bio;
828 rqd.opcode = cmd_op;
829 rqd.flags = flags;
830 rqd.nr_ppas = lm->smeta_sec;
a4bd217b
JG
831
832 for (i = 0; i < lm->smeta_sec; i++, paddr++) {
63e3809c
JG
833 struct pblk_sec_meta *meta_list = rqd.meta_list;
834
a4bd217b 835 rqd.ppa_list[i] = addr_to_gen_ppa(pblk, paddr, line->id);
63e3809c 836
e2cddf20 837 if (dir == PBLK_WRITE) {
f417aa0b 838 __le64 addr_empty = cpu_to_le64(ADDR_EMPTY);
63e3809c
JG
839
840 meta_list[i].lba = lba_list[paddr] = addr_empty;
841 }
a4bd217b
JG
842 }
843
844 /*
845 * This I/O is sent by the write thread when a line is replace. Since
846 * the write thread is the only one sending write and erase commands,
847 * there is no need to take the LUN semaphore.
848 */
1a94b2d4 849 ret = pblk_submit_io_sync(pblk, &rqd);
a4bd217b
JG
850 if (ret) {
851 pr_err("pblk: smeta I/O submission failed: %d\n", ret);
852 bio_put(bio);
853 goto free_ppa_list;
854 }
855
588726d3 856 atomic_dec(&pblk->inflight_io);
a4bd217b
JG
857
858 if (rqd.error) {
e2cddf20 859 if (dir == PBLK_WRITE)
a4bd217b 860 pblk_log_write_err(pblk, &rqd);
8f554597 861 else if (dir == PBLK_READ)
a4bd217b
JG
862 pblk_log_read_err(pblk, &rqd);
863 }
864
865free_ppa_list:
63e3809c 866 nvm_dev_dma_free(dev->parent, rqd.meta_list, rqd.dma_meta_list);
a4bd217b
JG
867
868 return ret;
869}
870
int pblk_line_read_smeta(struct pblk *pblk, struct pblk_line *line)
{
	u64 bpaddr = pblk_line_smeta_start(pblk, line);

	return pblk_line_submit_smeta_io(pblk, line, bpaddr, PBLK_READ_RECOV);
}

int pblk_line_read_emeta(struct pblk *pblk, struct pblk_line *line,
			 void *emeta_buf)
{
	return pblk_line_submit_emeta_io(pblk, line, emeta_buf,
						line->emeta_ssec, PBLK_READ);
}

static void pblk_setup_e_rq(struct pblk *pblk, struct nvm_rq *rqd,
			    struct ppa_addr ppa)
{
	rqd->opcode = NVM_OP_ERASE;
	rqd->ppa_addr = ppa;
	rqd->nr_ppas = 1;
	rqd->flags = pblk_set_progr_mode(pblk, PBLK_ERASE);
	rqd->bio = NULL;
}

static int pblk_blk_erase_sync(struct pblk *pblk, struct ppa_addr ppa)
{
	struct nvm_rq rqd;
	int ret = 0;

	memset(&rqd, 0, sizeof(struct nvm_rq));

	pblk_setup_e_rq(pblk, &rqd, ppa);

	/* The write thread schedules erases so that it minimizes disturbances
	 * with writes. Thus, there is no need to take the LUN semaphore.
	 */
	ret = pblk_submit_io_sync(pblk, &rqd);
	if (ret) {
		struct nvm_tgt_dev *dev = pblk->dev;
		struct nvm_geo *geo = &dev->geo;

		pr_err("pblk: could not sync erase line:%d,blk:%d\n",
					pblk_ppa_to_line(ppa),
					pblk_ppa_to_pos(geo, ppa));

		rqd.error = ret;
		goto out;
	}

out:
	rqd.private = pblk;
	__pblk_end_io_erase(pblk, &rqd);

	return ret;
}

int pblk_line_erase(struct pblk *pblk, struct pblk_line *line)
{
	struct pblk_line_meta *lm = &pblk->lm;
	struct ppa_addr ppa;
	int ret, bit = -1;

	/* Erase only good blocks, one at a time */
	do {
		spin_lock(&line->lock);
		bit = find_next_zero_bit(line->erase_bitmap, lm->blk_per_line,
								bit + 1);
		if (bit >= lm->blk_per_line) {
			spin_unlock(&line->lock);
			break;
		}

		ppa = pblk->luns[bit].bppa; /* set ch and lun */
		ppa.a.blk = line->id;

		atomic_dec(&line->left_eblks);
		WARN_ON(test_and_set_bit(bit, line->erase_bitmap));
		spin_unlock(&line->lock);

		ret = pblk_blk_erase_sync(pblk, ppa);
		if (ret) {
			pr_err("pblk: failed to erase line %d\n", line->id);
			return ret;
		}
	} while (1);

	return 0;
}

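/*
 * Claim one of the PBLK_DATA_LINES metadata slots for the line's
 * smeta/emeta buffers, dropping the free lock and rescheduling until
 * a slot becomes available.
 */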
static void pblk_line_setup_metadata(struct pblk_line *line,
				     struct pblk_line_mgmt *l_mg,
				     struct pblk_line_meta *lm)
{
	int meta_line;

	lockdep_assert_held(&l_mg->free_lock);

retry_meta:
	meta_line = find_first_zero_bit(&l_mg->meta_bitmap, PBLK_DATA_LINES);
	if (meta_line == PBLK_DATA_LINES) {
		spin_unlock(&l_mg->free_lock);
		io_schedule();
		spin_lock(&l_mg->free_lock);
		goto retry_meta;
	}

	set_bit(meta_line, &l_mg->meta_bitmap);
	line->meta_line = meta_line;

	line->smeta = l_mg->sline_meta[meta_line];
	line->emeta = l_mg->eline_meta[meta_line];

	memset(line->smeta, 0, lm->smeta_len);
	memset(line->emeta->buf, 0, lm->emeta_len[0]);

	line->emeta->mem = 0;
	atomic_set(&line->emeta->sync, 0);
}

/* For now lines are always assumed full lines. Thus, smeta former and current
 * lun bitmaps are omitted.
 */
static int pblk_line_init_metadata(struct pblk *pblk, struct pblk_line *line,
				   struct pblk_line *cur)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct pblk_line_meta *lm = &pblk->lm;
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_emeta *emeta = line->emeta;
	struct line_emeta *emeta_buf = emeta->buf;
	struct line_smeta *smeta_buf = (struct line_smeta *)line->smeta;
	int nr_blk_line;

	/* After erasing the line, new bad blocks might appear and we risk
	 * having an invalid line
	 */
	nr_blk_line = lm->blk_per_line -
			bitmap_weight(line->blk_bitmap, lm->blk_per_line);
	if (nr_blk_line < lm->min_blk_line) {
		spin_lock(&l_mg->free_lock);
		spin_lock(&line->lock);
		line->state = PBLK_LINESTATE_BAD;
		spin_unlock(&line->lock);

		list_add_tail(&line->list, &l_mg->bad_list);
		spin_unlock(&l_mg->free_lock);

		pr_debug("pblk: line %d is bad\n", line->id);

		return 0;
	}

	/* Run-time metadata */
	line->lun_bitmap = ((void *)(smeta_buf)) + sizeof(struct line_smeta);

	/* Mark LUNs allocated in this line (all for now) */
	bitmap_set(line->lun_bitmap, 0, lm->lun_bitmap_len);

	smeta_buf->header.identifier = cpu_to_le32(PBLK_MAGIC);
	memcpy(smeta_buf->header.uuid, pblk->instance_uuid, 16);
	smeta_buf->header.id = cpu_to_le32(line->id);
	smeta_buf->header.type = cpu_to_le16(line->type);
	smeta_buf->header.version_major = SMETA_VERSION_MAJOR;
	smeta_buf->header.version_minor = SMETA_VERSION_MINOR;

	/* Start metadata */
	smeta_buf->seq_nr = cpu_to_le64(line->seq_nr);
	smeta_buf->window_wr_lun = cpu_to_le32(geo->all_luns);

	/* Fill metadata among lines */
	if (cur) {
		memcpy(line->lun_bitmap, cur->lun_bitmap, lm->lun_bitmap_len);
		smeta_buf->prev_id = cpu_to_le32(cur->id);
		cur->emeta->buf->next_id = cpu_to_le32(line->id);
	} else {
		smeta_buf->prev_id = cpu_to_le32(PBLK_LINE_EMPTY);
	}

	/* All smeta must be set at this point */
	smeta_buf->header.crc = cpu_to_le32(
			pblk_calc_meta_header_crc(pblk, &smeta_buf->header));
	smeta_buf->crc = cpu_to_le32(pblk_calc_smeta_crc(pblk, smeta_buf));

	/* End metadata */
	memcpy(&emeta_buf->header, &smeta_buf->header,
						sizeof(struct line_header));

	emeta_buf->header.version_major = EMETA_VERSION_MAJOR;
	emeta_buf->header.version_minor = EMETA_VERSION_MINOR;
	emeta_buf->header.crc = cpu_to_le32(
			pblk_calc_meta_header_crc(pblk, &emeta_buf->header));

	emeta_buf->seq_nr = cpu_to_le64(line->seq_nr);
	emeta_buf->nr_lbas = cpu_to_le64(line->sec_in_line);
	emeta_buf->nr_valid_lbas = cpu_to_le64(0);
	emeta_buf->next_id = cpu_to_le32(PBLK_LINE_EMPTY);
	emeta_buf->crc = cpu_to_le32(0);
	emeta_buf->prev_id = smeta_buf->prev_id;

	return 1;
}

/* For now lines are always assumed full lines. Thus, smeta former and current
 * lun bitmaps are omitted.
 */
static int pblk_line_init_bb(struct pblk *pblk, struct pblk_line *line,
			     int init)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct pblk_line_meta *lm = &pblk->lm;
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	u64 off;
	int bit = -1;
	int emeta_secs;

	line->sec_in_line = lm->sec_per_line;

	/* Capture bad block information on line mapping bitmaps */
	while ((bit = find_next_bit(line->blk_bitmap, lm->blk_per_line,
					bit + 1)) < lm->blk_per_line) {
		off = bit * geo->ws_opt;
		bitmap_shift_left(l_mg->bb_aux, l_mg->bb_template, off,
							lm->sec_per_line);
		bitmap_or(line->map_bitmap, line->map_bitmap, l_mg->bb_aux,
							lm->sec_per_line);
		line->sec_in_line -= geo->clba;
	}

	/* Mark smeta metadata sectors as bad sectors */
	bit = find_first_zero_bit(line->blk_bitmap, lm->blk_per_line);
	off = bit * geo->ws_opt;
	bitmap_set(line->map_bitmap, off, lm->smeta_sec);
	line->sec_in_line -= lm->smeta_sec;
	line->smeta_ssec = off;
	line->cur_sec = off + lm->smeta_sec;

	if (init && pblk_line_submit_smeta_io(pblk, line, off, PBLK_WRITE)) {
		pr_debug("pblk: line smeta I/O failed. Retry\n");
		return 1;
	}

	bitmap_copy(line->invalid_bitmap, line->map_bitmap, lm->sec_per_line);

	/* Mark emeta metadata sectors as bad sectors. We need to consider bad
	 * blocks to make sure that there are enough sectors to store emeta
	 */
	emeta_secs = lm->emeta_sec[0];
	off = lm->sec_per_line;
	while (emeta_secs) {
		off -= geo->ws_opt;
		if (!test_bit(off, line->invalid_bitmap)) {
			bitmap_set(line->invalid_bitmap, off, geo->ws_opt);
			emeta_secs -= geo->ws_opt;
		}
	}

	line->emeta_ssec = off;
	line->sec_in_line -= lm->emeta_sec[0];
	line->nr_valid_lbas = 0;
	line->left_msecs = line->sec_in_line;
	*line->vsc = cpu_to_le32(line->sec_in_line);

	if (lm->sec_per_line - line->sec_in_line !=
		bitmap_weight(line->invalid_bitmap, lm->sec_per_line)) {
		spin_lock(&line->lock);
		line->state = PBLK_LINESTATE_BAD;
		spin_unlock(&line->lock);

		list_add_tail(&line->list, &l_mg->bad_list);
		pr_err("pblk: unexpected line %d is bad\n", line->id);

		return 0;
	}

	return 1;
}

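/*
 * On a line that has never been written, chunks the device reports as
 * free are already erased; mark them in the erase bitmap and return
 * the number of blocks that still need an erase.
 */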
static int pblk_prepare_new_line(struct pblk *pblk, struct pblk_line *line)
{
	struct pblk_line_meta *lm = &pblk->lm;
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	int blk_to_erase = atomic_read(&line->blk_in_line);
	int i;

	for (i = 0; i < lm->blk_per_line; i++) {
		struct pblk_lun *rlun = &pblk->luns[i];
		int pos = pblk_ppa_to_pos(geo, rlun->bppa);
		int state = line->chks[pos].state;

		/* Free chunks should not be erased */
		if (state & NVM_CHK_ST_FREE) {
			set_bit(pblk_ppa_to_pos(geo, rlun->bppa),
							line->erase_bitmap);
			blk_to_erase--;
		}
	}

	return blk_to_erase;
}

static int pblk_line_prepare(struct pblk *pblk, struct pblk_line *line)
{
	struct pblk_line_meta *lm = &pblk->lm;
	int blk_to_erase;

	line->map_bitmap = kzalloc(lm->sec_bitmap_len, GFP_ATOMIC);
	if (!line->map_bitmap)
		return -ENOMEM;

	/* will be initialized using bb info from map_bitmap */
	line->invalid_bitmap = kmalloc(lm->sec_bitmap_len, GFP_ATOMIC);
	if (!line->invalid_bitmap) {
		kfree(line->map_bitmap);
		return -ENOMEM;
	}

	/* Bad blocks do not need to be erased */
	bitmap_copy(line->erase_bitmap, line->blk_bitmap, lm->blk_per_line);

	spin_lock(&line->lock);

	/* If we have not written to this line, we need to mark up free chunks
	 * as already erased
	 */
	if (line->state == PBLK_LINESTATE_NEW) {
		blk_to_erase = pblk_prepare_new_line(pblk, line);
		line->state = PBLK_LINESTATE_FREE;
	} else {
		blk_to_erase = atomic_read(&line->blk_in_line);
	}

	if (line->state != PBLK_LINESTATE_FREE) {
		kfree(line->map_bitmap);
		kfree(line->invalid_bitmap);
		spin_unlock(&line->lock);
		WARN(1, "pblk: corrupted line %d, state %d\n",
							line->id, line->state);
		return -EAGAIN;
	}

	line->state = PBLK_LINESTATE_OPEN;

	atomic_set(&line->left_eblks, blk_to_erase);
	atomic_set(&line->left_seblks, blk_to_erase);

	line->meta_distance = lm->meta_distance;
	spin_unlock(&line->lock);

	kref_init(&line->ref);

	return 0;
}

int pblk_line_recov_alloc(struct pblk *pblk, struct pblk_line *line)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	int ret;

	spin_lock(&l_mg->free_lock);
	l_mg->data_line = line;
	list_del(&line->list);

	ret = pblk_line_prepare(pblk, line);
	if (ret) {
		list_add(&line->list, &l_mg->free_list);
		spin_unlock(&l_mg->free_lock);
		return ret;
	}
	spin_unlock(&l_mg->free_lock);

	pblk_rl_free_lines_dec(&pblk->rl, line, true);

	if (!pblk_line_init_bb(pblk, line, 0)) {
		list_add(&line->list, &l_mg->free_list);
		return -EINTR;
	}

	return 0;
}

void pblk_line_recov_close(struct pblk *pblk, struct pblk_line *line)
{
	kfree(line->map_bitmap);
	line->map_bitmap = NULL;
	line->smeta = NULL;
	line->emeta = NULL;
}

struct pblk_line *pblk_line_get(struct pblk *pblk)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_line_meta *lm = &pblk->lm;
	struct pblk_line *line;
	int ret, bit;

	lockdep_assert_held(&l_mg->free_lock);

retry:
	if (list_empty(&l_mg->free_list)) {
		pr_err("pblk: no free lines\n");
		return NULL;
	}

	line = list_first_entry(&l_mg->free_list, struct pblk_line, list);
	list_del(&line->list);
	l_mg->nr_free_lines--;

	bit = find_first_zero_bit(line->blk_bitmap, lm->blk_per_line);
	if (unlikely(bit >= lm->blk_per_line)) {
		spin_lock(&line->lock);
		line->state = PBLK_LINESTATE_BAD;
		spin_unlock(&line->lock);

		list_add_tail(&line->list, &l_mg->bad_list);

		pr_debug("pblk: line %d is bad\n", line->id);
		goto retry;
	}

	ret = pblk_line_prepare(pblk, line);
	if (ret) {
		if (ret == -EAGAIN) {
			list_add(&line->list, &l_mg->corrupt_list);
			goto retry;
		} else {
			pr_err("pblk: failed to prepare line %d\n", line->id);
			list_add(&line->list, &l_mg->free_list);
			l_mg->nr_free_lines++;
			return NULL;
		}
	}

	return line;
}

static struct pblk_line *pblk_line_retry(struct pblk *pblk,
					 struct pblk_line *line)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_line *retry_line;

retry:
	spin_lock(&l_mg->free_lock);
	retry_line = pblk_line_get(pblk);
	if (!retry_line) {
		l_mg->data_line = NULL;
		spin_unlock(&l_mg->free_lock);
		return NULL;
	}

	retry_line->smeta = line->smeta;
	retry_line->emeta = line->emeta;
	retry_line->meta_line = line->meta_line;

	pblk_line_free(pblk, line);
	l_mg->data_line = retry_line;
	spin_unlock(&l_mg->free_lock);

	pblk_rl_free_lines_dec(&pblk->rl, line, false);

	if (pblk_line_erase(pblk, retry_line))
		goto retry;

	return retry_line;
}

static void pblk_set_space_limit(struct pblk *pblk)
{
	struct pblk_rl *rl = &pblk->rl;

	atomic_set(&rl->rb_space, 0);
}

struct pblk_line *pblk_line_get_first_data(struct pblk *pblk)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_line *line;

	spin_lock(&l_mg->free_lock);
	line = pblk_line_get(pblk);
	if (!line) {
		spin_unlock(&l_mg->free_lock);
		return NULL;
	}

	line->seq_nr = l_mg->d_seq_nr++;
	line->type = PBLK_LINETYPE_DATA;
	l_mg->data_line = line;

	pblk_line_setup_metadata(line, l_mg, &pblk->lm);

	/* Allocate next line for preparation */
	l_mg->data_next = pblk_line_get(pblk);
	if (!l_mg->data_next) {
		/* If we cannot get a new line, we need to stop the pipeline.
		 * Only allow as many writes in as we can store safely and then
		 * fail gracefully
		 */
		pblk_set_space_limit(pblk);

		l_mg->data_next = NULL;
	} else {
		l_mg->data_next->seq_nr = l_mg->d_seq_nr++;
		l_mg->data_next->type = PBLK_LINETYPE_DATA;
	}
	spin_unlock(&l_mg->free_lock);

	if (pblk_line_erase(pblk, line)) {
		line = pblk_line_retry(pblk, line);
		if (!line)
			return NULL;
	}

retry_setup:
	if (!pblk_line_init_metadata(pblk, line, NULL)) {
		line = pblk_line_retry(pblk, line);
		if (!line)
			return NULL;

		goto retry_setup;
	}

	if (!pblk_line_init_bb(pblk, line, 1)) {
		line = pblk_line_retry(pblk, line);
		if (!line)
			return NULL;

		goto retry_setup;
	}

	pblk_rl_free_lines_dec(&pblk->rl, line, true);

	return line;
}

static void pblk_stop_writes(struct pblk *pblk, struct pblk_line *line)
{
	lockdep_assert_held(&pblk->l_mg.free_lock);

	pblk_set_space_limit(pblk);
	pblk->state = PBLK_STATE_STOPPING;
}

static void pblk_line_close_meta_sync(struct pblk *pblk)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_line_meta *lm = &pblk->lm;
	struct pblk_line *line, *tline;
	LIST_HEAD(list);

	spin_lock(&l_mg->close_lock);
	if (list_empty(&l_mg->emeta_list)) {
		spin_unlock(&l_mg->close_lock);
		return;
	}

	list_cut_position(&list, &l_mg->emeta_list, l_mg->emeta_list.prev);
	spin_unlock(&l_mg->close_lock);

	list_for_each_entry_safe(line, tline, &list, list) {
		struct pblk_emeta *emeta = line->emeta;

		while (emeta->mem < lm->emeta_len[0]) {
			int ret;

			ret = pblk_submit_meta_io(pblk, line);
			if (ret) {
				pr_err("pblk: sync meta line %d failed (%d)\n",
							line->id, ret);
				return;
			}
		}
	}

	pblk_wait_for_meta(pblk);
	flush_workqueue(pblk->close_wq);
}

void pblk_pipeline_stop(struct pblk *pblk)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	int ret;

	spin_lock(&l_mg->free_lock);
	if (pblk->state == PBLK_STATE_RECOVERING ||
					pblk->state == PBLK_STATE_STOPPED) {
		spin_unlock(&l_mg->free_lock);
		return;
	}
	pblk->state = PBLK_STATE_RECOVERING;
	spin_unlock(&l_mg->free_lock);

	pblk_flush_writer(pblk);
	pblk_wait_for_meta(pblk);

	ret = pblk_recov_pad(pblk);
	if (ret) {
		pr_err("pblk: could not close data on teardown(%d)\n", ret);
		return;
	}

	flush_workqueue(pblk->bb_wq);
	pblk_line_close_meta_sync(pblk);

	spin_lock(&l_mg->free_lock);
	pblk->state = PBLK_STATE_STOPPED;
	l_mg->data_line = NULL;
	l_mg->data_next = NULL;
	spin_unlock(&l_mg->free_lock);
}

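/*
 * Swap the open data line for the prepared next one: wait until the new
 * line has finished erasing, initialize its metadata, and get another
 * line ready so the pipeline can be stopped gracefully if the free list
 * runs dry.
 */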
struct pblk_line *pblk_line_replace_data(struct pblk *pblk)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_line *cur, *new = NULL;
	unsigned int left_seblks;

	cur = l_mg->data_line;
	new = l_mg->data_next;
	if (!new)
		goto out;
	l_mg->data_line = new;

	spin_lock(&l_mg->free_lock);
	pblk_line_setup_metadata(new, l_mg, &pblk->lm);
	spin_unlock(&l_mg->free_lock);

retry_erase:
	left_seblks = atomic_read(&new->left_seblks);
	if (left_seblks) {
		/* If line is not fully erased, erase it */
		if (atomic_read(&new->left_eblks)) {
			if (pblk_line_erase(pblk, new))
				goto out;
		} else {
			io_schedule();
		}
		goto retry_erase;
	}

retry_setup:
	if (!pblk_line_init_metadata(pblk, new, cur)) {
		new = pblk_line_retry(pblk, new);
		if (!new)
			goto out;

		goto retry_setup;
	}

	if (!pblk_line_init_bb(pblk, new, 1)) {
		new = pblk_line_retry(pblk, new);
		if (!new)
			goto out;

		goto retry_setup;
	}

	pblk_rl_free_lines_dec(&pblk->rl, new, true);

	/* Allocate next line for preparation */
	spin_lock(&l_mg->free_lock);
	l_mg->data_next = pblk_line_get(pblk);
	if (!l_mg->data_next) {
		/* If we cannot get a new line, we need to stop the pipeline.
		 * Only allow as many writes in as we can store safely and then
		 * fail gracefully
		 */
		pblk_stop_writes(pblk, new);
		l_mg->data_next = NULL;
	} else {
		l_mg->data_next->seq_nr = l_mg->d_seq_nr++;
		l_mg->data_next->type = PBLK_LINETYPE_DATA;
	}
	spin_unlock(&l_mg->free_lock);

out:
	return new;
}

void pblk_line_free(struct pblk *pblk, struct pblk_line *line)
{
	kfree(line->map_bitmap);
	kfree(line->invalid_bitmap);

	*line->vsc = cpu_to_le32(EMPTY_ENTRY);

	line->map_bitmap = NULL;
	line->invalid_bitmap = NULL;
	line->smeta = NULL;
	line->emeta = NULL;
}

static void __pblk_line_put(struct pblk *pblk, struct pblk_line *line)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_gc *gc = &pblk->gc;

	spin_lock(&line->lock);
	WARN_ON(line->state != PBLK_LINESTATE_GC);
	line->state = PBLK_LINESTATE_FREE;
	line->gc_group = PBLK_LINEGC_NONE;
	pblk_line_free(pblk, line);
	spin_unlock(&line->lock);

	atomic_dec(&gc->pipeline_gc);

	spin_lock(&l_mg->free_lock);
	list_add_tail(&line->list, &l_mg->free_list);
	l_mg->nr_free_lines++;
	spin_unlock(&l_mg->free_lock);

	pblk_rl_free_lines_inc(&pblk->rl, line);
}

static void pblk_line_put_ws(struct work_struct *work)
{
	struct pblk_line_ws *line_put_ws = container_of(work,
						struct pblk_line_ws, ws);
	struct pblk *pblk = line_put_ws->pblk;
	struct pblk_line *line = line_put_ws->line;

	__pblk_line_put(pblk, line);
	mempool_free(line_put_ws, &pblk->gen_ws_pool);
}

void pblk_line_put(struct kref *ref)
{
	struct pblk_line *line = container_of(ref, struct pblk_line, ref);
	struct pblk *pblk = line->pblk;

	__pblk_line_put(pblk, line);
}

void pblk_line_put_wq(struct kref *ref)
{
	struct pblk_line *line = container_of(ref, struct pblk_line, ref);
	struct pblk *pblk = line->pblk;
	struct pblk_line_ws *line_put_ws;

	line_put_ws = mempool_alloc(&pblk->gen_ws_pool, GFP_ATOMIC);
	if (!line_put_ws)
		return;

	line_put_ws->pblk = pblk;
	line_put_ws->line = line;
	line_put_ws->priv = NULL;

	INIT_WORK(&line_put_ws->ws, pblk_line_put_ws);
	queue_work(pblk->r_end_wq, &line_put_ws->ws);
}

int pblk_blk_erase_async(struct pblk *pblk, struct ppa_addr ppa)
{
	struct nvm_rq *rqd;
	int err;

	rqd = pblk_alloc_rqd(pblk, PBLK_ERASE);

	pblk_setup_e_rq(pblk, rqd, ppa);

	rqd->end_io = pblk_end_io_erase;
	rqd->private = pblk;

	/* The write thread schedules erases so that it minimizes disturbances
	 * with writes. Thus, there is no need to take the LUN semaphore.
	 */
	err = pblk_submit_io(pblk, rqd);
	if (err) {
		struct nvm_tgt_dev *dev = pblk->dev;
		struct nvm_geo *geo = &dev->geo;

		pr_err("pblk: could not async erase line:%d,blk:%d\n",
					pblk_ppa_to_line(ppa),
					pblk_ppa_to_pos(geo, ppa));
	}

	return err;
}

struct pblk_line *pblk_line_get_data(struct pblk *pblk)
{
	return pblk->l_mg.data_line;
}

/* For now, always erase next line */
struct pblk_line *pblk_line_get_erase(struct pblk *pblk)
{
	return pblk->l_mg.data_next;
}

int pblk_line_is_full(struct pblk_line *line)
{
	return (line->left_msecs == 0);
}

static void pblk_line_should_sync_meta(struct pblk *pblk)
{
	if (pblk_rl_is_limit(&pblk->rl))
		pblk_line_close_meta_sync(pblk);
}

void pblk_line_close(struct pblk *pblk, struct pblk_line *line)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct pblk_line_meta *lm = &pblk->lm;
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct list_head *move_list;
	int i;

#ifdef CONFIG_NVM_DEBUG
	WARN(!bitmap_full(line->map_bitmap, lm->sec_per_line),
				"pblk: corrupt closed line %d\n", line->id);
#endif

	spin_lock(&l_mg->free_lock);
	WARN_ON(!test_and_clear_bit(line->meta_line, &l_mg->meta_bitmap));
	spin_unlock(&l_mg->free_lock);

	spin_lock(&l_mg->gc_lock);
	spin_lock(&line->lock);
	WARN_ON(line->state != PBLK_LINESTATE_OPEN);
	line->state = PBLK_LINESTATE_CLOSED;
	move_list = pblk_line_gc_list(pblk, line);

	list_add_tail(&line->list, move_list);

	kfree(line->map_bitmap);
	line->map_bitmap = NULL;
	line->smeta = NULL;
	line->emeta = NULL;

	for (i = 0; i < lm->blk_per_line; i++) {
		struct pblk_lun *rlun = &pblk->luns[i];
		int pos = pblk_ppa_to_pos(geo, rlun->bppa);
		int state = line->chks[pos].state;

		if (!(state & NVM_CHK_ST_OFFLINE))
			line->chks[pos].state = NVM_CHK_ST_CLOSED;
	}

	spin_unlock(&line->lock);
	spin_unlock(&l_mg->gc_lock);
}

void pblk_line_close_meta(struct pblk *pblk, struct pblk_line *line)
{
	struct pblk_line_mgmt *l_mg = &pblk->l_mg;
	struct pblk_line_meta *lm = &pblk->lm;
	struct pblk_emeta *emeta = line->emeta;
	struct line_emeta *emeta_buf = emeta->buf;
	struct wa_counters *wa = emeta_to_wa(lm, emeta_buf);

	/* No need for an exact vsc value; avoid a big line lock and take an
	 * approximation.
	 */
	memcpy(emeta_to_vsc(pblk, emeta_buf), l_mg->vsc_list, lm->vsc_list_len);
	memcpy(emeta_to_bb(emeta_buf), line->blk_bitmap, lm->blk_bitmap_len);

	wa->user = cpu_to_le64(atomic64_read(&pblk->user_wa));
	wa->pad = cpu_to_le64(atomic64_read(&pblk->pad_wa));
	wa->gc = cpu_to_le64(atomic64_read(&pblk->gc_wa));

	emeta_buf->nr_valid_lbas = cpu_to_le64(line->nr_valid_lbas);
	emeta_buf->crc = cpu_to_le32(pblk_calc_emeta_crc(pblk, emeta_buf));

	spin_lock(&l_mg->close_lock);
	spin_lock(&line->lock);
	list_add_tail(&line->list, &l_mg->emeta_list);
	spin_unlock(&line->lock);
	spin_unlock(&l_mg->close_lock);

	pblk_line_should_sync_meta(pblk);
}

void pblk_line_close_ws(struct work_struct *work)
{
	struct pblk_line_ws *line_ws = container_of(work, struct pblk_line_ws,
									ws);
	struct pblk *pblk = line_ws->pblk;
	struct pblk_line *line = line_ws->line;

	pblk_line_close(pblk, line);
	mempool_free(line_ws, &pblk->gen_ws_pool);
}

void pblk_gen_run_ws(struct pblk *pblk, struct pblk_line *line, void *priv,
		     void (*work)(struct work_struct *), gfp_t gfp_mask,
		     struct workqueue_struct *wq)
{
	struct pblk_line_ws *line_ws;

	line_ws = mempool_alloc(&pblk->gen_ws_pool, gfp_mask);

	line_ws->pblk = pblk;
	line_ws->line = line;
	line_ws->priv = priv;

	INIT_WORK(&line_ws->ws, work);
	queue_work(wq, &line_ws->ws);
}

static void __pblk_down_page(struct pblk *pblk, struct ppa_addr *ppa_list,
			     int nr_ppas, int pos)
{
	struct pblk_lun *rlun = &pblk->luns[pos];
	int ret;

	/*
	 * Only send one inflight I/O per LUN. Since we map at a page
	 * granularity, all ppas in the I/O will map to the same LUN
	 */
#ifdef CONFIG_NVM_DEBUG
	int i;

	for (i = 1; i < nr_ppas; i++)
		WARN_ON(ppa_list[0].a.lun != ppa_list[i].a.lun ||
				ppa_list[0].a.ch != ppa_list[i].a.ch);
#endif

	ret = down_timeout(&rlun->wr_sem, msecs_to_jiffies(30000));
	if (ret == -ETIME || ret == -EINTR)
		pr_err("pblk: taking lun semaphore timed out: err %d\n", -ret);
}

void pblk_down_page(struct pblk *pblk, struct ppa_addr *ppa_list, int nr_ppas)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	int pos = pblk_ppa_to_pos(geo, ppa_list[0]);

	__pblk_down_page(pblk, ppa_list, nr_ppas, pos);
}

void pblk_down_rq(struct pblk *pblk, struct ppa_addr *ppa_list, int nr_ppas,
		  unsigned long *lun_bitmap)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	int pos = pblk_ppa_to_pos(geo, ppa_list[0]);

	/* If the LUN has been locked for this same request, do not attempt to
	 * lock it again
	 */
	if (test_and_set_bit(pos, lun_bitmap))
		return;

	__pblk_down_page(pblk, ppa_list, nr_ppas, pos);
}

void pblk_up_page(struct pblk *pblk, struct ppa_addr *ppa_list, int nr_ppas)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct pblk_lun *rlun;
	int pos = pblk_ppa_to_pos(geo, ppa_list[0]);

#ifdef CONFIG_NVM_DEBUG
	int i;

	for (i = 1; i < nr_ppas; i++)
		WARN_ON(ppa_list[0].a.lun != ppa_list[i].a.lun ||
				ppa_list[0].a.ch != ppa_list[i].a.ch);
#endif

	rlun = &pblk->luns[pos];
	up(&rlun->wr_sem);
}

void pblk_up_rq(struct pblk *pblk, struct ppa_addr *ppa_list, int nr_ppas,
		unsigned long *lun_bitmap)
{
	struct nvm_tgt_dev *dev = pblk->dev;
	struct nvm_geo *geo = &dev->geo;
	struct pblk_lun *rlun;
	int num_lun = geo->all_luns;
	int bit = -1;

	while ((bit = find_next_bit(lun_bitmap, num_lun, bit + 1)) < num_lun) {
		rlun = &pblk->luns[bit];
		up(&rlun->wr_sem);
	}
}

void pblk_update_map(struct pblk *pblk, sector_t lba, struct ppa_addr ppa)
{
	struct ppa_addr ppa_l2p;

	/* logic error: lba out-of-bounds. Ignore update */
	if (!(lba < pblk->rl.nr_secs)) {
		WARN(1, "pblk: corrupted L2P map request\n");
		return;
	}

	spin_lock(&pblk->trans_lock);
	ppa_l2p = pblk_trans_map_get(pblk, lba);

	if (!pblk_addr_in_cache(ppa_l2p) && !pblk_ppa_empty(ppa_l2p))
		pblk_map_invalidate(pblk, ppa_l2p);

	pblk_trans_map_set(pblk, lba, ppa);
	spin_unlock(&pblk->trans_lock);
}

void pblk_update_map_cache(struct pblk *pblk, sector_t lba, struct ppa_addr ppa)
{
#ifdef CONFIG_NVM_DEBUG
	/* Callers must ensure that the ppa points to a cache address */
	BUG_ON(!pblk_addr_in_cache(ppa));
	BUG_ON(pblk_rb_pos_oob(&pblk->rwb, pblk_addr_to_cacheline(ppa)));
#endif

	pblk_update_map(pblk, lba, ppa);
}

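/*
 * A GC update only wins if the L2P entry still points to the sector
 * being garbage collected; if user I/O remapped the lba in the
 * meantime, the update is dropped and 0 is returned so the caller can
 * discard the stale data.
 */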
int pblk_update_map_gc(struct pblk *pblk, sector_t lba, struct ppa_addr ppa_new,
		       struct pblk_line *gc_line, u64 paddr_gc)
{
	struct ppa_addr ppa_l2p, ppa_gc;
	int ret = 1;

#ifdef CONFIG_NVM_DEBUG
	/* Callers must ensure that the ppa points to a cache address */
	BUG_ON(!pblk_addr_in_cache(ppa_new));
	BUG_ON(pblk_rb_pos_oob(&pblk->rwb, pblk_addr_to_cacheline(ppa_new)));
#endif

	/* logic error: lba out-of-bounds. Ignore update */
	if (!(lba < pblk->rl.nr_secs)) {
		WARN(1, "pblk: corrupted L2P map request\n");
		return 0;
	}

	spin_lock(&pblk->trans_lock);
	ppa_l2p = pblk_trans_map_get(pblk, lba);
	ppa_gc = addr_to_gen_ppa(pblk, paddr_gc, gc_line->id);

	if (!pblk_ppa_comp(ppa_l2p, ppa_gc)) {
		spin_lock(&gc_line->lock);
		WARN(!test_bit(paddr_gc, gc_line->invalid_bitmap),
						"pblk: corrupted GC update");
		spin_unlock(&gc_line->lock);

		ret = 0;
		goto out;
	}

	pblk_trans_map_set(pblk, lba, ppa_new);
out:
	spin_unlock(&pblk->trans_lock);
	return ret;
}

void pblk_update_map_dev(struct pblk *pblk, sector_t lba,
			 struct ppa_addr ppa_mapped, struct ppa_addr ppa_cache)
{
	struct ppa_addr ppa_l2p;

#ifdef CONFIG_NVM_DEBUG
	/* Callers must ensure that the ppa points to a device address */
	BUG_ON(pblk_addr_in_cache(ppa_mapped));
#endif
	/* Invalidate and discard padded entries */
	if (lba == ADDR_EMPTY) {
		atomic64_inc(&pblk->pad_wa);
#ifdef CONFIG_NVM_DEBUG
		atomic_long_inc(&pblk->padded_wb);
#endif
		if (!pblk_ppa_empty(ppa_mapped))
			pblk_map_invalidate(pblk, ppa_mapped);
		return;
	}

	/* logic error: lba out-of-bounds. Ignore update */
	if (!(lba < pblk->rl.nr_secs)) {
		WARN(1, "pblk: corrupted L2P map request\n");
		return;
	}

	spin_lock(&pblk->trans_lock);
	ppa_l2p = pblk_trans_map_get(pblk, lba);

	/* Do not update L2P if the cacheline has been updated. In this case,
	 * the mapped ppa must be invalidated
	 */
	if (!pblk_ppa_comp(ppa_l2p, ppa_cache)) {
		if (!pblk_ppa_empty(ppa_mapped))
			pblk_map_invalidate(pblk, ppa_mapped);
		goto out;
	}

#ifdef CONFIG_NVM_DEBUG
	WARN_ON(!pblk_addr_in_cache(ppa_l2p) && !pblk_ppa_empty(ppa_l2p));
#endif

	pblk_trans_map_set(pblk, lba, ppa_mapped);
out:
	spin_unlock(&pblk->trans_lock);
}

void pblk_lookup_l2p_seq(struct pblk *pblk, struct ppa_addr *ppas,
			 sector_t blba, int nr_secs)
{
	int i;

	spin_lock(&pblk->trans_lock);
	for (i = 0; i < nr_secs; i++) {
		struct ppa_addr ppa;

		ppa = ppas[i] = pblk_trans_map_get(pblk, blba + i);

		/* If the L2P entry maps to a line, the reference is valid */
		if (!pblk_ppa_empty(ppa) && !pblk_addr_in_cache(ppa)) {
			int line_id = pblk_ppa_to_line(ppa);
			struct pblk_line *line = &pblk->lines[line_id];

			kref_get(&line->ref);
		}
	}
	spin_unlock(&pblk->trans_lock);
}

void pblk_lookup_l2p_rand(struct pblk *pblk, struct ppa_addr *ppas,
			  u64 *lba_list, int nr_secs)
{
	u64 lba;
	int i;

	spin_lock(&pblk->trans_lock);
	for (i = 0; i < nr_secs; i++) {
		lba = lba_list[i];
		if (lba != ADDR_EMPTY) {
			/* logic error: lba out-of-bounds. Ignore update */
			if (!(lba < pblk->rl.nr_secs)) {
				WARN(1, "pblk: corrupted L2P map request\n");
				continue;
			}
			ppas[i] = pblk_trans_map_get(pblk, lba);
		}
	}
	spin_unlock(&pblk->trans_lock);
}