1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Copyright (C) 2016 CNEX Labs
4*4882a593Smuzhiyun * Initial release: Javier Gonzalez <javier@cnexlabs.com>
5*4882a593Smuzhiyun * Matias Bjorling <matias@cnexlabs.com>
6*4882a593Smuzhiyun *
7*4882a593Smuzhiyun * This program is free software; you can redistribute it and/or
8*4882a593Smuzhiyun * modify it under the terms of the GNU General Public License version
9*4882a593Smuzhiyun * 2 as published by the Free Software Foundation.
10*4882a593Smuzhiyun *
11*4882a593Smuzhiyun * This program is distributed in the hope that it will be useful, but
12*4882a593Smuzhiyun * WITHOUT ANY WARRANTY; without even the implied warranty of
13*4882a593Smuzhiyun * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14*4882a593Smuzhiyun * General Public License for more details.
15*4882a593Smuzhiyun *
16*4882a593Smuzhiyun * pblk-write.c - pblk's write path from write buffer to media
17*4882a593Smuzhiyun */
18*4882a593Smuzhiyun
19*4882a593Smuzhiyun #include "pblk.h"
20*4882a593Smuzhiyun #include "pblk-trace.h"
21*4882a593Smuzhiyun
pblk_end_w_bio(struct pblk * pblk,struct nvm_rq * rqd,struct pblk_c_ctx * c_ctx)22*4882a593Smuzhiyun static unsigned long pblk_end_w_bio(struct pblk *pblk, struct nvm_rq *rqd,
23*4882a593Smuzhiyun struct pblk_c_ctx *c_ctx)
24*4882a593Smuzhiyun {
25*4882a593Smuzhiyun struct bio *original_bio;
26*4882a593Smuzhiyun struct pblk_rb *rwb = &pblk->rwb;
27*4882a593Smuzhiyun unsigned long ret;
28*4882a593Smuzhiyun int i;
29*4882a593Smuzhiyun
30*4882a593Smuzhiyun for (i = 0; i < c_ctx->nr_valid; i++) {
31*4882a593Smuzhiyun struct pblk_w_ctx *w_ctx;
32*4882a593Smuzhiyun int pos = c_ctx->sentry + i;
33*4882a593Smuzhiyun int flags;
34*4882a593Smuzhiyun
35*4882a593Smuzhiyun w_ctx = pblk_rb_w_ctx(rwb, pos);
36*4882a593Smuzhiyun flags = READ_ONCE(w_ctx->flags);
37*4882a593Smuzhiyun
38*4882a593Smuzhiyun if (flags & PBLK_FLUSH_ENTRY) {
39*4882a593Smuzhiyun flags &= ~PBLK_FLUSH_ENTRY;
40*4882a593Smuzhiyun /* Release flags on context. Protect from writes */
41*4882a593Smuzhiyun smp_store_release(&w_ctx->flags, flags);
42*4882a593Smuzhiyun
43*4882a593Smuzhiyun #ifdef CONFIG_NVM_PBLK_DEBUG
44*4882a593Smuzhiyun atomic_dec(&rwb->inflight_flush_point);
45*4882a593Smuzhiyun #endif
46*4882a593Smuzhiyun }
47*4882a593Smuzhiyun
48*4882a593Smuzhiyun while ((original_bio = bio_list_pop(&w_ctx->bios)))
49*4882a593Smuzhiyun bio_endio(original_bio);
50*4882a593Smuzhiyun }
51*4882a593Smuzhiyun
52*4882a593Smuzhiyun if (c_ctx->nr_padded)
53*4882a593Smuzhiyun pblk_bio_free_pages(pblk, rqd->bio, c_ctx->nr_valid,
54*4882a593Smuzhiyun c_ctx->nr_padded);
55*4882a593Smuzhiyun
56*4882a593Smuzhiyun #ifdef CONFIG_NVM_PBLK_DEBUG
57*4882a593Smuzhiyun atomic_long_add(rqd->nr_ppas, &pblk->sync_writes);
58*4882a593Smuzhiyun #endif
59*4882a593Smuzhiyun
60*4882a593Smuzhiyun ret = pblk_rb_sync_advance(&pblk->rwb, c_ctx->nr_valid);
61*4882a593Smuzhiyun
62*4882a593Smuzhiyun bio_put(rqd->bio);
63*4882a593Smuzhiyun pblk_free_rqd(pblk, rqd, PBLK_WRITE);
64*4882a593Smuzhiyun
65*4882a593Smuzhiyun return ret;
66*4882a593Smuzhiyun }
67*4882a593Smuzhiyun
pblk_end_queued_w_bio(struct pblk * pblk,struct nvm_rq * rqd,struct pblk_c_ctx * c_ctx)68*4882a593Smuzhiyun static unsigned long pblk_end_queued_w_bio(struct pblk *pblk,
69*4882a593Smuzhiyun struct nvm_rq *rqd,
70*4882a593Smuzhiyun struct pblk_c_ctx *c_ctx)
71*4882a593Smuzhiyun {
72*4882a593Smuzhiyun list_del(&c_ctx->list);
73*4882a593Smuzhiyun return pblk_end_w_bio(pblk, rqd, c_ctx);
74*4882a593Smuzhiyun }
75*4882a593Smuzhiyun
pblk_complete_write(struct pblk * pblk,struct nvm_rq * rqd,struct pblk_c_ctx * c_ctx)76*4882a593Smuzhiyun static void pblk_complete_write(struct pblk *pblk, struct nvm_rq *rqd,
77*4882a593Smuzhiyun struct pblk_c_ctx *c_ctx)
78*4882a593Smuzhiyun {
79*4882a593Smuzhiyun struct pblk_c_ctx *c, *r;
80*4882a593Smuzhiyun unsigned long flags;
81*4882a593Smuzhiyun unsigned long pos;
82*4882a593Smuzhiyun
83*4882a593Smuzhiyun #ifdef CONFIG_NVM_PBLK_DEBUG
84*4882a593Smuzhiyun atomic_long_sub(c_ctx->nr_valid, &pblk->inflight_writes);
85*4882a593Smuzhiyun #endif
86*4882a593Smuzhiyun pblk_up_rq(pblk, c_ctx->lun_bitmap);
87*4882a593Smuzhiyun
88*4882a593Smuzhiyun pos = pblk_rb_sync_init(&pblk->rwb, &flags);
89*4882a593Smuzhiyun if (pos == c_ctx->sentry) {
90*4882a593Smuzhiyun pos = pblk_end_w_bio(pblk, rqd, c_ctx);
91*4882a593Smuzhiyun
92*4882a593Smuzhiyun retry:
93*4882a593Smuzhiyun list_for_each_entry_safe(c, r, &pblk->compl_list, list) {
94*4882a593Smuzhiyun rqd = nvm_rq_from_c_ctx(c);
95*4882a593Smuzhiyun if (c->sentry == pos) {
96*4882a593Smuzhiyun pos = pblk_end_queued_w_bio(pblk, rqd, c);
97*4882a593Smuzhiyun goto retry;
98*4882a593Smuzhiyun }
99*4882a593Smuzhiyun }
100*4882a593Smuzhiyun } else {
101*4882a593Smuzhiyun WARN_ON(nvm_rq_from_c_ctx(c_ctx) != rqd);
102*4882a593Smuzhiyun list_add_tail(&c_ctx->list, &pblk->compl_list);
103*4882a593Smuzhiyun }
104*4882a593Smuzhiyun pblk_rb_sync_end(&pblk->rwb, &flags);
105*4882a593Smuzhiyun }
106*4882a593Smuzhiyun
107*4882a593Smuzhiyun /* Map remaining sectors in chunk, starting from ppa */
pblk_map_remaining(struct pblk * pblk,struct ppa_addr * ppa,int rqd_ppas)108*4882a593Smuzhiyun static void pblk_map_remaining(struct pblk *pblk, struct ppa_addr *ppa,
109*4882a593Smuzhiyun int rqd_ppas)
110*4882a593Smuzhiyun {
111*4882a593Smuzhiyun struct pblk_line *line;
112*4882a593Smuzhiyun struct ppa_addr map_ppa = *ppa;
113*4882a593Smuzhiyun __le64 addr_empty = cpu_to_le64(ADDR_EMPTY);
114*4882a593Smuzhiyun __le64 *lba_list;
115*4882a593Smuzhiyun u64 paddr;
116*4882a593Smuzhiyun int done = 0;
117*4882a593Smuzhiyun int n = 0;
118*4882a593Smuzhiyun
119*4882a593Smuzhiyun line = pblk_ppa_to_line(pblk, *ppa);
120*4882a593Smuzhiyun lba_list = emeta_to_lbas(pblk, line->emeta->buf);
121*4882a593Smuzhiyun
122*4882a593Smuzhiyun spin_lock(&line->lock);
123*4882a593Smuzhiyun
124*4882a593Smuzhiyun while (!done) {
125*4882a593Smuzhiyun paddr = pblk_dev_ppa_to_line_addr(pblk, map_ppa);
126*4882a593Smuzhiyun
127*4882a593Smuzhiyun if (!test_and_set_bit(paddr, line->map_bitmap))
128*4882a593Smuzhiyun line->left_msecs--;
129*4882a593Smuzhiyun
130*4882a593Smuzhiyun if (n < rqd_ppas && lba_list[paddr] != addr_empty)
131*4882a593Smuzhiyun line->nr_valid_lbas--;
132*4882a593Smuzhiyun
133*4882a593Smuzhiyun lba_list[paddr] = addr_empty;
134*4882a593Smuzhiyun
135*4882a593Smuzhiyun if (!test_and_set_bit(paddr, line->invalid_bitmap))
136*4882a593Smuzhiyun le32_add_cpu(line->vsc, -1);
137*4882a593Smuzhiyun
138*4882a593Smuzhiyun done = nvm_next_ppa_in_chk(pblk->dev, &map_ppa);
139*4882a593Smuzhiyun
140*4882a593Smuzhiyun n++;
141*4882a593Smuzhiyun }
142*4882a593Smuzhiyun
143*4882a593Smuzhiyun line->w_err_gc->has_write_err = 1;
144*4882a593Smuzhiyun spin_unlock(&line->lock);
145*4882a593Smuzhiyun }
146*4882a593Smuzhiyun
pblk_prepare_resubmit(struct pblk * pblk,unsigned int sentry,unsigned int nr_entries)147*4882a593Smuzhiyun static void pblk_prepare_resubmit(struct pblk *pblk, unsigned int sentry,
148*4882a593Smuzhiyun unsigned int nr_entries)
149*4882a593Smuzhiyun {
150*4882a593Smuzhiyun struct pblk_rb *rb = &pblk->rwb;
151*4882a593Smuzhiyun struct pblk_rb_entry *entry;
152*4882a593Smuzhiyun struct pblk_line *line;
153*4882a593Smuzhiyun struct pblk_w_ctx *w_ctx;
154*4882a593Smuzhiyun struct ppa_addr ppa_l2p;
155*4882a593Smuzhiyun int flags;
156*4882a593Smuzhiyun unsigned int i;
157*4882a593Smuzhiyun
158*4882a593Smuzhiyun spin_lock(&pblk->trans_lock);
159*4882a593Smuzhiyun for (i = 0; i < nr_entries; i++) {
160*4882a593Smuzhiyun entry = &rb->entries[pblk_rb_ptr_wrap(rb, sentry, i)];
161*4882a593Smuzhiyun w_ctx = &entry->w_ctx;
162*4882a593Smuzhiyun
163*4882a593Smuzhiyun /* Check if the lba has been overwritten */
164*4882a593Smuzhiyun if (w_ctx->lba != ADDR_EMPTY) {
165*4882a593Smuzhiyun ppa_l2p = pblk_trans_map_get(pblk, w_ctx->lba);
166*4882a593Smuzhiyun if (!pblk_ppa_comp(ppa_l2p, entry->cacheline))
167*4882a593Smuzhiyun w_ctx->lba = ADDR_EMPTY;
168*4882a593Smuzhiyun }
169*4882a593Smuzhiyun
170*4882a593Smuzhiyun /* Mark up the entry as submittable again */
171*4882a593Smuzhiyun flags = READ_ONCE(w_ctx->flags);
172*4882a593Smuzhiyun flags |= PBLK_WRITTEN_DATA;
173*4882a593Smuzhiyun /* Release flags on write context. Protect from writes */
174*4882a593Smuzhiyun smp_store_release(&w_ctx->flags, flags);
175*4882a593Smuzhiyun
176*4882a593Smuzhiyun /* Decrease the reference count to the line as we will
177*4882a593Smuzhiyun * re-map these entries
178*4882a593Smuzhiyun */
179*4882a593Smuzhiyun line = pblk_ppa_to_line(pblk, w_ctx->ppa);
180*4882a593Smuzhiyun atomic_dec(&line->sec_to_update);
181*4882a593Smuzhiyun kref_put(&line->ref, pblk_line_put);
182*4882a593Smuzhiyun }
183*4882a593Smuzhiyun spin_unlock(&pblk->trans_lock);
184*4882a593Smuzhiyun }
185*4882a593Smuzhiyun
pblk_queue_resubmit(struct pblk * pblk,struct pblk_c_ctx * c_ctx)186*4882a593Smuzhiyun static void pblk_queue_resubmit(struct pblk *pblk, struct pblk_c_ctx *c_ctx)
187*4882a593Smuzhiyun {
188*4882a593Smuzhiyun struct pblk_c_ctx *r_ctx;
189*4882a593Smuzhiyun
190*4882a593Smuzhiyun r_ctx = kzalloc(sizeof(struct pblk_c_ctx), GFP_KERNEL);
191*4882a593Smuzhiyun if (!r_ctx)
192*4882a593Smuzhiyun return;
193*4882a593Smuzhiyun
194*4882a593Smuzhiyun r_ctx->lun_bitmap = NULL;
195*4882a593Smuzhiyun r_ctx->sentry = c_ctx->sentry;
196*4882a593Smuzhiyun r_ctx->nr_valid = c_ctx->nr_valid;
197*4882a593Smuzhiyun r_ctx->nr_padded = c_ctx->nr_padded;
198*4882a593Smuzhiyun
199*4882a593Smuzhiyun spin_lock(&pblk->resubmit_lock);
200*4882a593Smuzhiyun list_add_tail(&r_ctx->list, &pblk->resubmit_list);
201*4882a593Smuzhiyun spin_unlock(&pblk->resubmit_lock);
202*4882a593Smuzhiyun
203*4882a593Smuzhiyun #ifdef CONFIG_NVM_PBLK_DEBUG
204*4882a593Smuzhiyun atomic_long_add(c_ctx->nr_valid, &pblk->recov_writes);
205*4882a593Smuzhiyun #endif
206*4882a593Smuzhiyun }
207*4882a593Smuzhiyun
pblk_submit_rec(struct work_struct * work)208*4882a593Smuzhiyun static void pblk_submit_rec(struct work_struct *work)
209*4882a593Smuzhiyun {
210*4882a593Smuzhiyun struct pblk_rec_ctx *recovery =
211*4882a593Smuzhiyun container_of(work, struct pblk_rec_ctx, ws_rec);
212*4882a593Smuzhiyun struct pblk *pblk = recovery->pblk;
213*4882a593Smuzhiyun struct nvm_rq *rqd = recovery->rqd;
214*4882a593Smuzhiyun struct pblk_c_ctx *c_ctx = nvm_rq_to_pdu(rqd);
215*4882a593Smuzhiyun struct ppa_addr *ppa_list = nvm_rq_to_ppa_list(rqd);
216*4882a593Smuzhiyun
217*4882a593Smuzhiyun pblk_log_write_err(pblk, rqd);
218*4882a593Smuzhiyun
219*4882a593Smuzhiyun pblk_map_remaining(pblk, ppa_list, rqd->nr_ppas);
220*4882a593Smuzhiyun pblk_queue_resubmit(pblk, c_ctx);
221*4882a593Smuzhiyun
222*4882a593Smuzhiyun pblk_up_rq(pblk, c_ctx->lun_bitmap);
223*4882a593Smuzhiyun if (c_ctx->nr_padded)
224*4882a593Smuzhiyun pblk_bio_free_pages(pblk, rqd->bio, c_ctx->nr_valid,
225*4882a593Smuzhiyun c_ctx->nr_padded);
226*4882a593Smuzhiyun bio_put(rqd->bio);
227*4882a593Smuzhiyun pblk_free_rqd(pblk, rqd, PBLK_WRITE);
228*4882a593Smuzhiyun mempool_free(recovery, &pblk->rec_pool);
229*4882a593Smuzhiyun
230*4882a593Smuzhiyun atomic_dec(&pblk->inflight_io);
231*4882a593Smuzhiyun pblk_write_kick(pblk);
232*4882a593Smuzhiyun }
233*4882a593Smuzhiyun
234*4882a593Smuzhiyun
pblk_end_w_fail(struct pblk * pblk,struct nvm_rq * rqd)235*4882a593Smuzhiyun static void pblk_end_w_fail(struct pblk *pblk, struct nvm_rq *rqd)
236*4882a593Smuzhiyun {
237*4882a593Smuzhiyun struct pblk_rec_ctx *recovery;
238*4882a593Smuzhiyun
239*4882a593Smuzhiyun recovery = mempool_alloc(&pblk->rec_pool, GFP_ATOMIC);
240*4882a593Smuzhiyun if (!recovery) {
241*4882a593Smuzhiyun pblk_err(pblk, "could not allocate recovery work\n");
242*4882a593Smuzhiyun return;
243*4882a593Smuzhiyun }
244*4882a593Smuzhiyun
245*4882a593Smuzhiyun recovery->pblk = pblk;
246*4882a593Smuzhiyun recovery->rqd = rqd;
247*4882a593Smuzhiyun
248*4882a593Smuzhiyun INIT_WORK(&recovery->ws_rec, pblk_submit_rec);
249*4882a593Smuzhiyun queue_work(pblk->close_wq, &recovery->ws_rec);
250*4882a593Smuzhiyun }
251*4882a593Smuzhiyun
pblk_end_io_write(struct nvm_rq * rqd)252*4882a593Smuzhiyun static void pblk_end_io_write(struct nvm_rq *rqd)
253*4882a593Smuzhiyun {
254*4882a593Smuzhiyun struct pblk *pblk = rqd->private;
255*4882a593Smuzhiyun struct pblk_c_ctx *c_ctx = nvm_rq_to_pdu(rqd);
256*4882a593Smuzhiyun
257*4882a593Smuzhiyun if (rqd->error) {
258*4882a593Smuzhiyun pblk_end_w_fail(pblk, rqd);
259*4882a593Smuzhiyun return;
260*4882a593Smuzhiyun } else {
261*4882a593Smuzhiyun if (trace_pblk_chunk_state_enabled())
262*4882a593Smuzhiyun pblk_check_chunk_state_update(pblk, rqd);
263*4882a593Smuzhiyun #ifdef CONFIG_NVM_PBLK_DEBUG
264*4882a593Smuzhiyun WARN_ONCE(rqd->bio->bi_status, "pblk: corrupted write error\n");
265*4882a593Smuzhiyun #endif
266*4882a593Smuzhiyun }
267*4882a593Smuzhiyun
268*4882a593Smuzhiyun pblk_complete_write(pblk, rqd, c_ctx);
269*4882a593Smuzhiyun atomic_dec(&pblk->inflight_io);
270*4882a593Smuzhiyun }
271*4882a593Smuzhiyun
pblk_end_io_write_meta(struct nvm_rq * rqd)272*4882a593Smuzhiyun static void pblk_end_io_write_meta(struct nvm_rq *rqd)
273*4882a593Smuzhiyun {
274*4882a593Smuzhiyun struct pblk *pblk = rqd->private;
275*4882a593Smuzhiyun struct pblk_g_ctx *m_ctx = nvm_rq_to_pdu(rqd);
276*4882a593Smuzhiyun struct pblk_line *line = m_ctx->private;
277*4882a593Smuzhiyun struct pblk_emeta *emeta = line->emeta;
278*4882a593Smuzhiyun struct ppa_addr *ppa_list = nvm_rq_to_ppa_list(rqd);
279*4882a593Smuzhiyun int sync;
280*4882a593Smuzhiyun
281*4882a593Smuzhiyun pblk_up_chunk(pblk, ppa_list[0]);
282*4882a593Smuzhiyun
283*4882a593Smuzhiyun if (rqd->error) {
284*4882a593Smuzhiyun pblk_log_write_err(pblk, rqd);
285*4882a593Smuzhiyun pblk_err(pblk, "metadata I/O failed. Line %d\n", line->id);
286*4882a593Smuzhiyun line->w_err_gc->has_write_err = 1;
287*4882a593Smuzhiyun } else {
288*4882a593Smuzhiyun if (trace_pblk_chunk_state_enabled())
289*4882a593Smuzhiyun pblk_check_chunk_state_update(pblk, rqd);
290*4882a593Smuzhiyun }
291*4882a593Smuzhiyun
292*4882a593Smuzhiyun sync = atomic_add_return(rqd->nr_ppas, &emeta->sync);
293*4882a593Smuzhiyun if (sync == emeta->nr_entries)
294*4882a593Smuzhiyun pblk_gen_run_ws(pblk, line, NULL, pblk_line_close_ws,
295*4882a593Smuzhiyun GFP_ATOMIC, pblk->close_wq);
296*4882a593Smuzhiyun
297*4882a593Smuzhiyun pblk_free_rqd(pblk, rqd, PBLK_WRITE_INT);
298*4882a593Smuzhiyun
299*4882a593Smuzhiyun atomic_dec(&pblk->inflight_io);
300*4882a593Smuzhiyun }
301*4882a593Smuzhiyun
/*
 * Initialise rqd as a sequential NVM_OP_PWRITE request of nr_secs sectors
 * owned by pblk, completing through end_io, and allocate its metadata.
 *
 * Returns the result of pblk_alloc_rqd_meta().
 */
static int pblk_alloc_w_rq(struct pblk *pblk, struct nvm_rq *rqd,
			   unsigned int nr_secs, nvm_end_io_fn(*end_io))
{
	int err;

	rqd->private = pblk;
	rqd->end_io = end_io;
	rqd->opcode = NVM_OP_PWRITE;
	rqd->is_seq = 1;
	rqd->nr_ppas = nr_secs;

	err = pblk_alloc_rqd_meta(pblk, rqd);

	return err;
}
314*4882a593Smuzhiyun
pblk_setup_w_rq(struct pblk * pblk,struct nvm_rq * rqd,struct ppa_addr * erase_ppa)315*4882a593Smuzhiyun static int pblk_setup_w_rq(struct pblk *pblk, struct nvm_rq *rqd,
316*4882a593Smuzhiyun struct ppa_addr *erase_ppa)
317*4882a593Smuzhiyun {
318*4882a593Smuzhiyun struct pblk_line_meta *lm = &pblk->lm;
319*4882a593Smuzhiyun struct pblk_line *e_line = pblk_line_get_erase(pblk);
320*4882a593Smuzhiyun struct pblk_c_ctx *c_ctx = nvm_rq_to_pdu(rqd);
321*4882a593Smuzhiyun unsigned int valid = c_ctx->nr_valid;
322*4882a593Smuzhiyun unsigned int padded = c_ctx->nr_padded;
323*4882a593Smuzhiyun unsigned int nr_secs = valid + padded;
324*4882a593Smuzhiyun unsigned long *lun_bitmap;
325*4882a593Smuzhiyun int ret;
326*4882a593Smuzhiyun
327*4882a593Smuzhiyun lun_bitmap = kzalloc(lm->lun_bitmap_len, GFP_KERNEL);
328*4882a593Smuzhiyun if (!lun_bitmap)
329*4882a593Smuzhiyun return -ENOMEM;
330*4882a593Smuzhiyun c_ctx->lun_bitmap = lun_bitmap;
331*4882a593Smuzhiyun
332*4882a593Smuzhiyun ret = pblk_alloc_w_rq(pblk, rqd, nr_secs, pblk_end_io_write);
333*4882a593Smuzhiyun if (ret) {
334*4882a593Smuzhiyun kfree(lun_bitmap);
335*4882a593Smuzhiyun return ret;
336*4882a593Smuzhiyun }
337*4882a593Smuzhiyun
338*4882a593Smuzhiyun if (likely(!e_line || !atomic_read(&e_line->left_eblks)))
339*4882a593Smuzhiyun ret = pblk_map_rq(pblk, rqd, c_ctx->sentry, lun_bitmap,
340*4882a593Smuzhiyun valid, 0);
341*4882a593Smuzhiyun else
342*4882a593Smuzhiyun ret = pblk_map_erase_rq(pblk, rqd, c_ctx->sentry, lun_bitmap,
343*4882a593Smuzhiyun valid, erase_ppa);
344*4882a593Smuzhiyun
345*4882a593Smuzhiyun return ret;
346*4882a593Smuzhiyun }
347*4882a593Smuzhiyun
pblk_calc_secs_to_sync(struct pblk * pblk,unsigned int secs_avail,unsigned int secs_to_flush)348*4882a593Smuzhiyun static int pblk_calc_secs_to_sync(struct pblk *pblk, unsigned int secs_avail,
349*4882a593Smuzhiyun unsigned int secs_to_flush)
350*4882a593Smuzhiyun {
351*4882a593Smuzhiyun int secs_to_sync;
352*4882a593Smuzhiyun
353*4882a593Smuzhiyun secs_to_sync = pblk_calc_secs(pblk, secs_avail, secs_to_flush, true);
354*4882a593Smuzhiyun
355*4882a593Smuzhiyun #ifdef CONFIG_NVM_PBLK_DEBUG
356*4882a593Smuzhiyun if ((!secs_to_sync && secs_to_flush)
357*4882a593Smuzhiyun || (secs_to_sync < 0)
358*4882a593Smuzhiyun || (secs_to_sync > secs_avail && !secs_to_flush)) {
359*4882a593Smuzhiyun pblk_err(pblk, "bad sector calculation (a:%d,s:%d,f:%d)\n",
360*4882a593Smuzhiyun secs_avail, secs_to_sync, secs_to_flush);
361*4882a593Smuzhiyun }
362*4882a593Smuzhiyun #endif
363*4882a593Smuzhiyun
364*4882a593Smuzhiyun return secs_to_sync;
365*4882a593Smuzhiyun }
366*4882a593Smuzhiyun
pblk_submit_meta_io(struct pblk * pblk,struct pblk_line * meta_line)367*4882a593Smuzhiyun int pblk_submit_meta_io(struct pblk *pblk, struct pblk_line *meta_line)
368*4882a593Smuzhiyun {
369*4882a593Smuzhiyun struct nvm_tgt_dev *dev = pblk->dev;
370*4882a593Smuzhiyun struct nvm_geo *geo = &dev->geo;
371*4882a593Smuzhiyun struct pblk_line_mgmt *l_mg = &pblk->l_mg;
372*4882a593Smuzhiyun struct pblk_line_meta *lm = &pblk->lm;
373*4882a593Smuzhiyun struct pblk_emeta *emeta = meta_line->emeta;
374*4882a593Smuzhiyun struct ppa_addr *ppa_list;
375*4882a593Smuzhiyun struct pblk_g_ctx *m_ctx;
376*4882a593Smuzhiyun struct nvm_rq *rqd;
377*4882a593Smuzhiyun void *data;
378*4882a593Smuzhiyun u64 paddr;
379*4882a593Smuzhiyun int rq_ppas = pblk->min_write_pgs;
380*4882a593Smuzhiyun int id = meta_line->id;
381*4882a593Smuzhiyun int rq_len;
382*4882a593Smuzhiyun int i, j;
383*4882a593Smuzhiyun int ret;
384*4882a593Smuzhiyun
385*4882a593Smuzhiyun rqd = pblk_alloc_rqd(pblk, PBLK_WRITE_INT);
386*4882a593Smuzhiyun
387*4882a593Smuzhiyun m_ctx = nvm_rq_to_pdu(rqd);
388*4882a593Smuzhiyun m_ctx->private = meta_line;
389*4882a593Smuzhiyun
390*4882a593Smuzhiyun rq_len = rq_ppas * geo->csecs;
391*4882a593Smuzhiyun data = ((void *)emeta->buf) + emeta->mem;
392*4882a593Smuzhiyun
393*4882a593Smuzhiyun ret = pblk_alloc_w_rq(pblk, rqd, rq_ppas, pblk_end_io_write_meta);
394*4882a593Smuzhiyun if (ret)
395*4882a593Smuzhiyun goto fail_free_rqd;
396*4882a593Smuzhiyun
397*4882a593Smuzhiyun ppa_list = nvm_rq_to_ppa_list(rqd);
398*4882a593Smuzhiyun for (i = 0; i < rqd->nr_ppas; ) {
399*4882a593Smuzhiyun spin_lock(&meta_line->lock);
400*4882a593Smuzhiyun paddr = __pblk_alloc_page(pblk, meta_line, rq_ppas);
401*4882a593Smuzhiyun spin_unlock(&meta_line->lock);
402*4882a593Smuzhiyun for (j = 0; j < rq_ppas; j++, i++, paddr++)
403*4882a593Smuzhiyun ppa_list[i] = addr_to_gen_ppa(pblk, paddr, id);
404*4882a593Smuzhiyun }
405*4882a593Smuzhiyun
406*4882a593Smuzhiyun spin_lock(&l_mg->close_lock);
407*4882a593Smuzhiyun emeta->mem += rq_len;
408*4882a593Smuzhiyun if (emeta->mem >= lm->emeta_len[0])
409*4882a593Smuzhiyun list_del(&meta_line->list);
410*4882a593Smuzhiyun spin_unlock(&l_mg->close_lock);
411*4882a593Smuzhiyun
412*4882a593Smuzhiyun pblk_down_chunk(pblk, ppa_list[0]);
413*4882a593Smuzhiyun
414*4882a593Smuzhiyun ret = pblk_submit_io(pblk, rqd, data);
415*4882a593Smuzhiyun if (ret) {
416*4882a593Smuzhiyun pblk_err(pblk, "emeta I/O submission failed: %d\n", ret);
417*4882a593Smuzhiyun goto fail_rollback;
418*4882a593Smuzhiyun }
419*4882a593Smuzhiyun
420*4882a593Smuzhiyun return NVM_IO_OK;
421*4882a593Smuzhiyun
422*4882a593Smuzhiyun fail_rollback:
423*4882a593Smuzhiyun pblk_up_chunk(pblk, ppa_list[0]);
424*4882a593Smuzhiyun spin_lock(&l_mg->close_lock);
425*4882a593Smuzhiyun pblk_dealloc_page(pblk, meta_line, rq_ppas);
426*4882a593Smuzhiyun list_add(&meta_line->list, &meta_line->list);
427*4882a593Smuzhiyun spin_unlock(&l_mg->close_lock);
428*4882a593Smuzhiyun fail_free_rqd:
429*4882a593Smuzhiyun pblk_free_rqd(pblk, rqd, PBLK_WRITE_INT);
430*4882a593Smuzhiyun return ret;
431*4882a593Smuzhiyun }
432*4882a593Smuzhiyun
pblk_valid_meta_ppa(struct pblk * pblk,struct pblk_line * meta_line,struct nvm_rq * data_rqd)433*4882a593Smuzhiyun static inline bool pblk_valid_meta_ppa(struct pblk *pblk,
434*4882a593Smuzhiyun struct pblk_line *meta_line,
435*4882a593Smuzhiyun struct nvm_rq *data_rqd)
436*4882a593Smuzhiyun {
437*4882a593Smuzhiyun struct nvm_tgt_dev *dev = pblk->dev;
438*4882a593Smuzhiyun struct nvm_geo *geo = &dev->geo;
439*4882a593Smuzhiyun struct pblk_c_ctx *data_c_ctx = nvm_rq_to_pdu(data_rqd);
440*4882a593Smuzhiyun struct pblk_line *data_line = pblk_line_get_data(pblk);
441*4882a593Smuzhiyun struct ppa_addr ppa, ppa_opt;
442*4882a593Smuzhiyun u64 paddr;
443*4882a593Smuzhiyun int pos_opt;
444*4882a593Smuzhiyun
445*4882a593Smuzhiyun /* Schedule a metadata I/O that is half the distance from the data I/O
446*4882a593Smuzhiyun * with regards to the number of LUNs forming the pblk instance. This
447*4882a593Smuzhiyun * balances LUN conflicts across every I/O.
448*4882a593Smuzhiyun *
449*4882a593Smuzhiyun * When the LUN configuration changes (e.g., due to GC), this distance
450*4882a593Smuzhiyun * can align, which would result on metadata and data I/Os colliding. In
451*4882a593Smuzhiyun * this case, modify the distance to not be optimal, but move the
452*4882a593Smuzhiyun * optimal in the right direction.
453*4882a593Smuzhiyun */
454*4882a593Smuzhiyun paddr = pblk_lookup_page(pblk, meta_line);
455*4882a593Smuzhiyun ppa = addr_to_gen_ppa(pblk, paddr, 0);
456*4882a593Smuzhiyun ppa_opt = addr_to_gen_ppa(pblk, paddr + data_line->meta_distance, 0);
457*4882a593Smuzhiyun pos_opt = pblk_ppa_to_pos(geo, ppa_opt);
458*4882a593Smuzhiyun
459*4882a593Smuzhiyun if (test_bit(pos_opt, data_c_ctx->lun_bitmap) ||
460*4882a593Smuzhiyun test_bit(pos_opt, data_line->blk_bitmap))
461*4882a593Smuzhiyun return true;
462*4882a593Smuzhiyun
463*4882a593Smuzhiyun if (unlikely(pblk_ppa_comp(ppa_opt, ppa)))
464*4882a593Smuzhiyun data_line->meta_distance--;
465*4882a593Smuzhiyun
466*4882a593Smuzhiyun return false;
467*4882a593Smuzhiyun }
468*4882a593Smuzhiyun
pblk_should_submit_meta_io(struct pblk * pblk,struct nvm_rq * data_rqd)469*4882a593Smuzhiyun static struct pblk_line *pblk_should_submit_meta_io(struct pblk *pblk,
470*4882a593Smuzhiyun struct nvm_rq *data_rqd)
471*4882a593Smuzhiyun {
472*4882a593Smuzhiyun struct pblk_line_meta *lm = &pblk->lm;
473*4882a593Smuzhiyun struct pblk_line_mgmt *l_mg = &pblk->l_mg;
474*4882a593Smuzhiyun struct pblk_line *meta_line;
475*4882a593Smuzhiyun
476*4882a593Smuzhiyun spin_lock(&l_mg->close_lock);
477*4882a593Smuzhiyun if (list_empty(&l_mg->emeta_list)) {
478*4882a593Smuzhiyun spin_unlock(&l_mg->close_lock);
479*4882a593Smuzhiyun return NULL;
480*4882a593Smuzhiyun }
481*4882a593Smuzhiyun meta_line = list_first_entry(&l_mg->emeta_list, struct pblk_line, list);
482*4882a593Smuzhiyun if (meta_line->emeta->mem >= lm->emeta_len[0]) {
483*4882a593Smuzhiyun spin_unlock(&l_mg->close_lock);
484*4882a593Smuzhiyun return NULL;
485*4882a593Smuzhiyun }
486*4882a593Smuzhiyun spin_unlock(&l_mg->close_lock);
487*4882a593Smuzhiyun
488*4882a593Smuzhiyun if (!pblk_valid_meta_ppa(pblk, meta_line, data_rqd))
489*4882a593Smuzhiyun return NULL;
490*4882a593Smuzhiyun
491*4882a593Smuzhiyun return meta_line;
492*4882a593Smuzhiyun }
493*4882a593Smuzhiyun
pblk_submit_io_set(struct pblk * pblk,struct nvm_rq * rqd)494*4882a593Smuzhiyun static int pblk_submit_io_set(struct pblk *pblk, struct nvm_rq *rqd)
495*4882a593Smuzhiyun {
496*4882a593Smuzhiyun struct ppa_addr erase_ppa;
497*4882a593Smuzhiyun struct pblk_line *meta_line;
498*4882a593Smuzhiyun int err;
499*4882a593Smuzhiyun
500*4882a593Smuzhiyun pblk_ppa_set_empty(&erase_ppa);
501*4882a593Smuzhiyun
502*4882a593Smuzhiyun /* Assign lbas to ppas and populate request structure */
503*4882a593Smuzhiyun err = pblk_setup_w_rq(pblk, rqd, &erase_ppa);
504*4882a593Smuzhiyun if (err) {
505*4882a593Smuzhiyun pblk_err(pblk, "could not setup write request: %d\n", err);
506*4882a593Smuzhiyun return NVM_IO_ERR;
507*4882a593Smuzhiyun }
508*4882a593Smuzhiyun
509*4882a593Smuzhiyun meta_line = pblk_should_submit_meta_io(pblk, rqd);
510*4882a593Smuzhiyun
511*4882a593Smuzhiyun /* Submit data write for current data line */
512*4882a593Smuzhiyun err = pblk_submit_io(pblk, rqd, NULL);
513*4882a593Smuzhiyun if (err) {
514*4882a593Smuzhiyun pblk_err(pblk, "data I/O submission failed: %d\n", err);
515*4882a593Smuzhiyun return NVM_IO_ERR;
516*4882a593Smuzhiyun }
517*4882a593Smuzhiyun
518*4882a593Smuzhiyun if (!pblk_ppa_empty(erase_ppa)) {
519*4882a593Smuzhiyun /* Submit erase for next data line */
520*4882a593Smuzhiyun if (pblk_blk_erase_async(pblk, erase_ppa)) {
521*4882a593Smuzhiyun struct pblk_line *e_line = pblk_line_get_erase(pblk);
522*4882a593Smuzhiyun struct nvm_tgt_dev *dev = pblk->dev;
523*4882a593Smuzhiyun struct nvm_geo *geo = &dev->geo;
524*4882a593Smuzhiyun int bit;
525*4882a593Smuzhiyun
526*4882a593Smuzhiyun atomic_inc(&e_line->left_eblks);
527*4882a593Smuzhiyun bit = pblk_ppa_to_pos(geo, erase_ppa);
528*4882a593Smuzhiyun WARN_ON(!test_and_clear_bit(bit, e_line->erase_bitmap));
529*4882a593Smuzhiyun }
530*4882a593Smuzhiyun }
531*4882a593Smuzhiyun
532*4882a593Smuzhiyun if (meta_line) {
533*4882a593Smuzhiyun /* Submit metadata write for previous data line */
534*4882a593Smuzhiyun err = pblk_submit_meta_io(pblk, meta_line);
535*4882a593Smuzhiyun if (err) {
536*4882a593Smuzhiyun pblk_err(pblk, "metadata I/O submission failed: %d",
537*4882a593Smuzhiyun err);
538*4882a593Smuzhiyun return NVM_IO_ERR;
539*4882a593Smuzhiyun }
540*4882a593Smuzhiyun }
541*4882a593Smuzhiyun
542*4882a593Smuzhiyun return NVM_IO_OK;
543*4882a593Smuzhiyun }
544*4882a593Smuzhiyun
pblk_free_write_rqd(struct pblk * pblk,struct nvm_rq * rqd)545*4882a593Smuzhiyun static void pblk_free_write_rqd(struct pblk *pblk, struct nvm_rq *rqd)
546*4882a593Smuzhiyun {
547*4882a593Smuzhiyun struct pblk_c_ctx *c_ctx = nvm_rq_to_pdu(rqd);
548*4882a593Smuzhiyun struct bio *bio = rqd->bio;
549*4882a593Smuzhiyun
550*4882a593Smuzhiyun if (c_ctx->nr_padded)
551*4882a593Smuzhiyun pblk_bio_free_pages(pblk, bio, c_ctx->nr_valid,
552*4882a593Smuzhiyun c_ctx->nr_padded);
553*4882a593Smuzhiyun }
554*4882a593Smuzhiyun
pblk_submit_write(struct pblk * pblk,int * secs_left)555*4882a593Smuzhiyun static int pblk_submit_write(struct pblk *pblk, int *secs_left)
556*4882a593Smuzhiyun {
557*4882a593Smuzhiyun struct bio *bio;
558*4882a593Smuzhiyun struct nvm_rq *rqd;
559*4882a593Smuzhiyun unsigned int secs_avail, secs_to_sync, secs_to_com;
560*4882a593Smuzhiyun unsigned int secs_to_flush, packed_meta_pgs;
561*4882a593Smuzhiyun unsigned long pos;
562*4882a593Smuzhiyun unsigned int resubmit;
563*4882a593Smuzhiyun
564*4882a593Smuzhiyun *secs_left = 0;
565*4882a593Smuzhiyun
566*4882a593Smuzhiyun spin_lock(&pblk->resubmit_lock);
567*4882a593Smuzhiyun resubmit = !list_empty(&pblk->resubmit_list);
568*4882a593Smuzhiyun spin_unlock(&pblk->resubmit_lock);
569*4882a593Smuzhiyun
570*4882a593Smuzhiyun /* Resubmit failed writes first */
571*4882a593Smuzhiyun if (resubmit) {
572*4882a593Smuzhiyun struct pblk_c_ctx *r_ctx;
573*4882a593Smuzhiyun
574*4882a593Smuzhiyun spin_lock(&pblk->resubmit_lock);
575*4882a593Smuzhiyun r_ctx = list_first_entry(&pblk->resubmit_list,
576*4882a593Smuzhiyun struct pblk_c_ctx, list);
577*4882a593Smuzhiyun list_del(&r_ctx->list);
578*4882a593Smuzhiyun spin_unlock(&pblk->resubmit_lock);
579*4882a593Smuzhiyun
580*4882a593Smuzhiyun secs_avail = r_ctx->nr_valid;
581*4882a593Smuzhiyun pos = r_ctx->sentry;
582*4882a593Smuzhiyun
583*4882a593Smuzhiyun pblk_prepare_resubmit(pblk, pos, secs_avail);
584*4882a593Smuzhiyun secs_to_sync = pblk_calc_secs_to_sync(pblk, secs_avail,
585*4882a593Smuzhiyun secs_avail);
586*4882a593Smuzhiyun
587*4882a593Smuzhiyun kfree(r_ctx);
588*4882a593Smuzhiyun } else {
589*4882a593Smuzhiyun /* If there are no sectors in the cache,
590*4882a593Smuzhiyun * flushes (bios without data) will be cleared on
591*4882a593Smuzhiyun * the cache threads
592*4882a593Smuzhiyun */
593*4882a593Smuzhiyun secs_avail = pblk_rb_read_count(&pblk->rwb);
594*4882a593Smuzhiyun if (!secs_avail)
595*4882a593Smuzhiyun return 0;
596*4882a593Smuzhiyun
597*4882a593Smuzhiyun secs_to_flush = pblk_rb_flush_point_count(&pblk->rwb);
598*4882a593Smuzhiyun if (!secs_to_flush && secs_avail < pblk->min_write_pgs_data)
599*4882a593Smuzhiyun return 0;
600*4882a593Smuzhiyun
601*4882a593Smuzhiyun secs_to_sync = pblk_calc_secs_to_sync(pblk, secs_avail,
602*4882a593Smuzhiyun secs_to_flush);
603*4882a593Smuzhiyun if (secs_to_sync > pblk->max_write_pgs) {
604*4882a593Smuzhiyun pblk_err(pblk, "bad buffer sync calculation\n");
605*4882a593Smuzhiyun return 0;
606*4882a593Smuzhiyun }
607*4882a593Smuzhiyun
608*4882a593Smuzhiyun secs_to_com = (secs_to_sync > secs_avail) ?
609*4882a593Smuzhiyun secs_avail : secs_to_sync;
610*4882a593Smuzhiyun pos = pblk_rb_read_commit(&pblk->rwb, secs_to_com);
611*4882a593Smuzhiyun }
612*4882a593Smuzhiyun
613*4882a593Smuzhiyun packed_meta_pgs = (pblk->min_write_pgs - pblk->min_write_pgs_data);
614*4882a593Smuzhiyun bio = bio_alloc(GFP_KERNEL, secs_to_sync + packed_meta_pgs);
615*4882a593Smuzhiyun
616*4882a593Smuzhiyun bio->bi_iter.bi_sector = 0; /* internal bio */
617*4882a593Smuzhiyun bio_set_op_attrs(bio, REQ_OP_WRITE, 0);
618*4882a593Smuzhiyun
619*4882a593Smuzhiyun rqd = pblk_alloc_rqd(pblk, PBLK_WRITE);
620*4882a593Smuzhiyun rqd->bio = bio;
621*4882a593Smuzhiyun
622*4882a593Smuzhiyun if (pblk_rb_read_to_bio(&pblk->rwb, rqd, pos, secs_to_sync,
623*4882a593Smuzhiyun secs_avail)) {
624*4882a593Smuzhiyun pblk_err(pblk, "corrupted write bio\n");
625*4882a593Smuzhiyun goto fail_put_bio;
626*4882a593Smuzhiyun }
627*4882a593Smuzhiyun
628*4882a593Smuzhiyun if (pblk_submit_io_set(pblk, rqd))
629*4882a593Smuzhiyun goto fail_free_bio;
630*4882a593Smuzhiyun
631*4882a593Smuzhiyun #ifdef CONFIG_NVM_PBLK_DEBUG
632*4882a593Smuzhiyun atomic_long_add(secs_to_sync, &pblk->sub_writes);
633*4882a593Smuzhiyun #endif
634*4882a593Smuzhiyun
635*4882a593Smuzhiyun *secs_left = 1;
636*4882a593Smuzhiyun return 0;
637*4882a593Smuzhiyun
638*4882a593Smuzhiyun fail_free_bio:
639*4882a593Smuzhiyun pblk_free_write_rqd(pblk, rqd);
640*4882a593Smuzhiyun fail_put_bio:
641*4882a593Smuzhiyun bio_put(bio);
642*4882a593Smuzhiyun pblk_free_rqd(pblk, rqd, PBLK_WRITE);
643*4882a593Smuzhiyun
644*4882a593Smuzhiyun return -EINTR;
645*4882a593Smuzhiyun }
646*4882a593Smuzhiyun
pblk_write_ts(void * data)647*4882a593Smuzhiyun int pblk_write_ts(void *data)
648*4882a593Smuzhiyun {
649*4882a593Smuzhiyun struct pblk *pblk = data;
650*4882a593Smuzhiyun int secs_left;
651*4882a593Smuzhiyun int write_failure = 0;
652*4882a593Smuzhiyun
653*4882a593Smuzhiyun while (!kthread_should_stop()) {
654*4882a593Smuzhiyun if (!write_failure) {
655*4882a593Smuzhiyun write_failure = pblk_submit_write(pblk, &secs_left);
656*4882a593Smuzhiyun
657*4882a593Smuzhiyun if (secs_left)
658*4882a593Smuzhiyun continue;
659*4882a593Smuzhiyun }
660*4882a593Smuzhiyun set_current_state(TASK_INTERRUPTIBLE);
661*4882a593Smuzhiyun io_schedule();
662*4882a593Smuzhiyun }
663*4882a593Smuzhiyun
664*4882a593Smuzhiyun return 0;
665*4882a593Smuzhiyun }
666