1 // SPDX-License-Identifier: GPL-2.0
2
3 #define dev_fmt(fmt) "mtdoops-pstore: " fmt
4
5 #include <linux/kernel.h>
6 #include <linux/module.h>
7 #include <linux/pstore_blk.h>
8 #include <linux/mtd/mtd.h>
9 #include <linux/bitops.h>
10 #include <linux/slab.h>
11
12 static struct mtdpstore_context {
13 int index;
14 struct pstore_blk_config info;
15 struct pstore_device_info dev;
16 struct mtd_info *mtd;
17 unsigned long *rmmap; /* removed bit map */
18 unsigned long *usedmap; /* used bit map */
19 /*
20 * used for panic write
21 * As there are no block_isbad for panic case, we should keep this
22 * status before panic to ensure panic_write not failed.
23 */
24 unsigned long *badmap; /* bad block bit map */
25 } oops_cxt;
26
/*
 * Tell whether the erase block containing @off is bad.
 *
 * The cached bad-block bitmap is consulted first; only on a miss is the MTD
 * layer asked, and a positive answer is recorded in the bitmap.
 *
 * Returns 1 for a bad block, 0 for a good one, or the negative error code
 * reported by mtd_block_isbad().
 */
static int mtdpstore_block_isbad(struct mtdpstore_context *cxt, loff_t off)
{
	struct mtd_info *mtd = cxt->mtd;
	u64 blk;
	int bad;

	off = ALIGN_DOWN(off, mtd->erasesize);
	blk = div_u64(off, mtd->erasesize);

	/* already known to be bad, no need to query the device */
	if (test_bit(blk, cxt->badmap))
		return true;

	bad = mtd_block_isbad(mtd, off);
	if (bad < 0) {
		dev_err(&mtd->dev, "mtd_block_isbad failed, aborting\n");
		return bad;
	}
	if (!bad)
		return false;

	/* remember the verdict so later lookups can use the bitmap alone */
	set_bit(blk, cxt->badmap);
	return true;
}
48
/*
 * Panic-path variant of the bad-block check: looks only at the cached
 * bitmap and never calls into the MTD layer.
 *
 * Returns non-zero when the erase block containing @off is marked bad.
 */
static inline int mtdpstore_panic_block_isbad(struct mtdpstore_context *cxt,
		loff_t off)
{
	struct mtd_info *mtd = cxt->mtd;
	loff_t blkstart = ALIGN_DOWN(off, mtd->erasesize);

	return test_bit(div_u64(blkstart, mtd->erasesize), cxt->badmap);
}
59
/* Set the "used" bit of the kmsg_size zone that contains @off. */
static inline void mtdpstore_mark_used(struct mtdpstore_context *cxt,
		loff_t off)
{
	u64 zone = div_u64(off, cxt->info.kmsg_size);

	dev_dbg(&cxt->mtd->dev, "mark zone %llu used\n", zone);
	set_bit(zone, cxt->usedmap);
}
69
/* Clear the "used" bit of the kmsg_size zone that contains @off. */
static inline void mtdpstore_mark_unused(struct mtdpstore_context *cxt,
		loff_t off)
{
	u64 zone = div_u64(off, cxt->info.kmsg_size);

	dev_dbg(&cxt->mtd->dev, "mark zone %llu unused\n", zone);
	clear_bit(zone, cxt->usedmap);
}
79
/*
 * Clear the "used" bit of every zone in the erase block containing @off.
 * The number of zones per block is erasesize / kmsg_size.
 */
static inline void mtdpstore_block_mark_unused(struct mtdpstore_context *cxt,
		loff_t off)
{
	struct mtd_info *mtd = cxt->mtd;
	u32 per_blk = mtd->erasesize / cxt->info.kmsg_size;
	u64 zone;
	u32 i;

	/* start from the first zone of the block */
	off = ALIGN_DOWN(off, mtd->erasesize);
	zone = div_u64(off, cxt->info.kmsg_size);

	for (i = 0; i < per_blk; i++, zone++) {
		dev_dbg(&mtd->dev, "mark zone %llu unused\n", zone);
		clear_bit(zone, cxt->usedmap);
	}
}
96
/*
 * Tell whether the zone containing @off must be treated as occupied.
 *
 * A zone in a block marked bad is always reported as occupied; otherwise
 * the answer comes from the "used" bitmap.
 */
static inline int mtdpstore_is_used(struct mtdpstore_context *cxt, loff_t off)
{
	u64 blk = div_u64(off, cxt->mtd->erasesize);

	if (test_bit(blk, cxt->badmap))
		return true;

	return test_bit(div_u64(off, cxt->info.kmsg_size), cxt->usedmap);
}
106
/*
 * Tell whether any zone of the erase block containing @off is marked used.
 *
 * Returns 1 as soon as one used zone is found, 0 when none is.
 */
static int mtdpstore_block_is_used(struct mtdpstore_context *cxt,
		loff_t off)
{
	struct mtd_info *mtd = cxt->mtd;
	u32 per_blk = mtd->erasesize / cxt->info.kmsg_size;
	u64 zone;
	u32 i;

	off = ALIGN_DOWN(off, mtd->erasesize);
	zone = div_u64(off, cxt->info.kmsg_size);

	for (i = 0; i < per_blk; i++, zone++) {
		if (test_bit(zone, cxt->usedmap))
			return true;
	}
	return false;
}
124
/*
 * Decide whether @buf looks like erased flash.
 *
 * Only the leading bytes are inspected: at most a quarter of the device's
 * write size, or @size if that is smaller. The buffer counts as empty when
 * every inspected byte is 0xFF.
 *
 * Returns 1 when empty, 0 otherwise.
 */
static int mtdpstore_is_empty(struct mtdpstore_context *cxt, char *buf,
		size_t size)
{
	const char *p = buf;
	size_t left = min_t(uint32_t, size, cxt->mtd->writesize / 4);

	while (left--) {
		if (*p++ != (char)0xFF)
			return false;
	}
	return true;
}
139
/* Set the "removed" bit of the kmsg_size zone that contains @off. */
static void mtdpstore_mark_removed(struct mtdpstore_context *cxt, loff_t off)
{
	u64 zone = div_u64(off, cxt->info.kmsg_size);

	dev_dbg(&cxt->mtd->dev, "mark zone %llu removed\n", zone);
	set_bit(zone, cxt->rmmap);
}
148
/*
 * Clear the "removed" bit of every zone in the erase block containing @off.
 */
static void mtdpstore_block_clear_removed(struct mtdpstore_context *cxt,
		loff_t off)
{
	struct mtd_info *mtd = cxt->mtd;
	u32 per_blk = mtd->erasesize / cxt->info.kmsg_size;
	u64 zone;
	u32 i;

	off = ALIGN_DOWN(off, mtd->erasesize);
	zone = div_u64(off, cxt->info.kmsg_size);

	for (i = 0; i < per_blk; i++, zone++)
		clear_bit(zone, cxt->rmmap);
}
164
/*
 * Tell whether any zone of the erase block containing @off is marked
 * removed.
 *
 * Returns 1 as soon as one removed zone is found, 0 when none is.
 */
static int mtdpstore_block_is_removed(struct mtdpstore_context *cxt,
		loff_t off)
{
	struct mtd_info *mtd = cxt->mtd;
	u32 per_blk = mtd->erasesize / cxt->info.kmsg_size;
	u64 zone;
	u32 i;

	off = ALIGN_DOWN(off, mtd->erasesize);
	zone = div_u64(off, cxt->info.kmsg_size);

	for (i = 0; i < per_blk; i++, zone++) {
		if (test_bit(zone, cxt->rmmap))
			return true;
	}
	return false;
}
182
/*
 * Erase the whole erase block containing @off.
 *
 * On success the "removed" bits of the block's zones are cleared. On
 * failure an error is logged and the bitmaps are left untouched.
 *
 * Returns 0 on success or the error code from mtd_erase().
 */
static int mtdpstore_erase_do(struct mtdpstore_context *cxt, loff_t off)
{
	struct mtd_info *mtd = cxt->mtd;
	struct erase_info ei;
	int err;

	off = ALIGN_DOWN(off, mtd->erasesize);
	dev_dbg(&mtd->dev, "try to erase off 0x%llx\n", off);

	ei.addr = off;
	ei.len = mtd->erasesize;
	err = mtd_erase(mtd, &ei);
	if (err) {
		dev_err(&mtd->dev, "erase of region [0x%llx, 0x%llx] on \"%s\" failed\n",
			(unsigned long long)ei.addr,
			(unsigned long long)ei.len, cxt->info.device);
		return err;
	}

	mtdpstore_block_clear_removed(cxt, off);
	return 0;
}
202
203 /*
204 * called while removing file
205 *
206 * Avoiding over erasing, do erase block only when the whole block is unused.
207 * If the block contains valid log, do erase lazily on flush_removed() when
208 * unregister.
209 */
mtdpstore_erase(size_t size,loff_t off)210 static ssize_t mtdpstore_erase(size_t size, loff_t off)
211 {
212 struct mtdpstore_context *cxt = &oops_cxt;
213
214 if (mtdpstore_block_isbad(cxt, off))
215 return -EIO;
216
217 mtdpstore_mark_unused(cxt, off);
218
219 /* If the block still has valid data, mtdpstore do erase lazily */
220 if (likely(mtdpstore_block_is_used(cxt, off))) {
221 mtdpstore_mark_removed(cxt, off);
222 return 0;
223 }
224
225 /* all zones are unused, erase it */
226 return mtdpstore_erase_do(cxt, off);
227 }
228
229 /*
230 * What is security for mtdpstore?
231 * As there is no erase for panic case, we should ensure at least one zone
232 * is writable. Otherwise, panic write will fail.
233 * If zone is used, write operation will return -ENOMSG, which means that
234 * pstore/blk will try one by one until gets an empty zone. So, it is not
235 * needed to ensure the next zone is empty, but at least one.
236 */
mtdpstore_security(struct mtdpstore_context * cxt,loff_t off)237 static int mtdpstore_security(struct mtdpstore_context *cxt, loff_t off)
238 {
239 int ret = 0, i;
240 struct mtd_info *mtd = cxt->mtd;
241 u32 zonenum = (u32)div_u64(off, cxt->info.kmsg_size);
242 u32 zonecnt = (u32)div_u64(cxt->mtd->size, cxt->info.kmsg_size);
243 u32 blkcnt = (u32)div_u64(cxt->mtd->size, cxt->mtd->erasesize);
244 u32 erasesize = cxt->mtd->erasesize;
245
246 for (i = 0; i < zonecnt; i++) {
247 u32 num = (zonenum + i) % zonecnt;
248
249 /* found empty zone */
250 if (!test_bit(num, cxt->usedmap))
251 return 0;
252 }
253
254 /* If there is no any empty zone, we have no way but to do erase */
255 while (blkcnt--) {
256 div64_u64_rem(off + erasesize, cxt->mtd->size, (u64 *)&off);
257
258 if (mtdpstore_block_isbad(cxt, off))
259 continue;
260
261 ret = mtdpstore_erase_do(cxt, off);
262 if (!ret) {
263 mtdpstore_block_mark_unused(cxt, off);
264 break;
265 }
266 }
267
268 if (ret)
269 dev_err(&mtd->dev, "all blocks bad!\n");
270 dev_dbg(&mtd->dev, "end security\n");
271 return ret;
272 }
273
mtdpstore_write(const char * buf,size_t size,loff_t off)274 static ssize_t mtdpstore_write(const char *buf, size_t size, loff_t off)
275 {
276 struct mtdpstore_context *cxt = &oops_cxt;
277 struct mtd_info *mtd = cxt->mtd;
278 size_t retlen;
279 int ret;
280
281 if (mtdpstore_block_isbad(cxt, off))
282 return -ENOMSG;
283
284 /* zone is used, please try next one */
285 if (mtdpstore_is_used(cxt, off))
286 return -ENOMSG;
287
288 dev_dbg(&mtd->dev, "try to write off 0x%llx size %zu\n", off, size);
289 ret = mtd_write(cxt->mtd, off, size, &retlen, (u_char *)buf);
290 if (ret < 0 || retlen != size) {
291 dev_err(&mtd->dev, "write failure at %lld (%zu of %zu written), err %d\n",
292 off, retlen, size, ret);
293 return -EIO;
294 }
295 mtdpstore_mark_used(cxt, off);
296
297 mtdpstore_security(cxt, off);
298 return retlen;
299 }
300
/*
 * Tell whether @ret is a hard I/O error: a negative code that is neither a
 * bitflip nor an ECC error as classified by the MTD helpers.
 */
static inline bool mtdpstore_is_io_error(int ret)
{
	if (ret >= 0)
		return false;

	return !(mtd_is_bitflip(ret) || mtd_is_eccerr(ret));
}
305
306 /*
307 * All zones will be read as pstore/blk will read zone one by one when do
308 * recover.
309 */
mtdpstore_read(char * buf,size_t size,loff_t off)310 static ssize_t mtdpstore_read(char *buf, size_t size, loff_t off)
311 {
312 struct mtdpstore_context *cxt = &oops_cxt;
313 struct mtd_info *mtd = cxt->mtd;
314 size_t retlen, done;
315 int ret;
316
317 if (mtdpstore_block_isbad(cxt, off))
318 return -ENOMSG;
319
320 dev_dbg(&mtd->dev, "try to read off 0x%llx size %zu\n", off, size);
321 for (done = 0, retlen = 0; done < size; done += retlen) {
322 retlen = 0;
323
324 ret = mtd_read(cxt->mtd, off + done, size - done, &retlen,
325 (u_char *)buf + done);
326 if (mtdpstore_is_io_error(ret)) {
327 dev_err(&mtd->dev, "read failure at %lld (%zu of %zu read), err %d\n",
328 off + done, retlen, size - done, ret);
329 /* the zone may be broken, try next one */
330 return -ENOMSG;
331 }
332
333 /*
334 * ECC error. The impact on log data is so small. Maybe we can
335 * still read it and try to understand. So mtdpstore just hands
336 * over what it gets and user can judge whether the data is
337 * valid or not.
338 */
339 if (mtd_is_eccerr(ret)) {
340 dev_err(&mtd->dev, "ecc error at %lld (%zu of %zu read), err %d\n",
341 off + done, retlen, size - done, ret);
342 /* driver may not set retlen when ecc error */
343 retlen = retlen == 0 ? size - done : retlen;
344 }
345 }
346
347 if (mtdpstore_is_empty(cxt, buf, size))
348 mtdpstore_mark_unused(cxt, off);
349 else
350 mtdpstore_mark_used(cxt, off);
351
352 mtdpstore_security(cxt, off);
353 return retlen;
354 }
355
mtdpstore_panic_write(const char * buf,size_t size,loff_t off)356 static ssize_t mtdpstore_panic_write(const char *buf, size_t size, loff_t off)
357 {
358 struct mtdpstore_context *cxt = &oops_cxt;
359 struct mtd_info *mtd = cxt->mtd;
360 size_t retlen;
361 int ret;
362
363 if (mtdpstore_panic_block_isbad(cxt, off))
364 return -ENOMSG;
365
366 /* zone is used, please try next one */
367 if (mtdpstore_is_used(cxt, off))
368 return -ENOMSG;
369
370 ret = mtd_panic_write(cxt->mtd, off, size, &retlen, (u_char *)buf);
371 if (ret < 0 || size != retlen) {
372 dev_err(&mtd->dev, "panic write failure at %lld (%zu of %zu read), err %d\n",
373 off, retlen, size, ret);
374 return -EIO;
375 }
376 mtdpstore_mark_used(cxt, off);
377
378 return retlen;
379 }
380
mtdpstore_notify_add(struct mtd_info * mtd)381 static void mtdpstore_notify_add(struct mtd_info *mtd)
382 {
383 int ret;
384 struct mtdpstore_context *cxt = &oops_cxt;
385 struct pstore_blk_config *info = &cxt->info;
386 unsigned long longcnt;
387
388 if (!strcmp(mtd->name, info->device))
389 cxt->index = mtd->index;
390
391 if (mtd->index != cxt->index || cxt->index < 0)
392 return;
393
394 dev_dbg(&mtd->dev, "found matching MTD device %s\n", mtd->name);
395
396 if (mtd->size < info->kmsg_size * 2) {
397 dev_err(&mtd->dev, "MTD partition %d not big enough\n",
398 mtd->index);
399 return;
400 }
401 /*
402 * kmsg_size must be aligned to 4096 Bytes, which is limited by
403 * psblk. The default value of kmsg_size is 64KB. If kmsg_size
404 * is larger than erasesize, some errors will occur since mtdpstore
405 * is designed on it.
406 */
407 if (mtd->erasesize < info->kmsg_size) {
408 dev_err(&mtd->dev, "eraseblock size of MTD partition %d too small\n",
409 mtd->index);
410 return;
411 }
412 if (unlikely(info->kmsg_size % mtd->writesize)) {
413 dev_err(&mtd->dev, "record size %lu KB must align to write size %d KB\n",
414 info->kmsg_size / 1024,
415 mtd->writesize / 1024);
416 return;
417 }
418
419 longcnt = BITS_TO_LONGS(div_u64(mtd->size, info->kmsg_size));
420 cxt->rmmap = kcalloc(longcnt, sizeof(long), GFP_KERNEL);
421 cxt->usedmap = kcalloc(longcnt, sizeof(long), GFP_KERNEL);
422
423 longcnt = BITS_TO_LONGS(div_u64(mtd->size, mtd->erasesize));
424 cxt->badmap = kcalloc(longcnt, sizeof(long), GFP_KERNEL);
425
426 /* just support dmesg right now */
427 cxt->dev.flags = PSTORE_FLAGS_DMESG;
428 cxt->dev.zone.read = mtdpstore_read;
429 cxt->dev.zone.write = mtdpstore_write;
430 cxt->dev.zone.erase = mtdpstore_erase;
431 cxt->dev.zone.panic_write = mtdpstore_panic_write;
432 cxt->dev.zone.total_size = mtd->size;
433
434 ret = register_pstore_device(&cxt->dev);
435 if (ret) {
436 dev_err(&mtd->dev, "mtd%d register to psblk failed\n",
437 mtd->index);
438 return;
439 }
440 cxt->mtd = mtd;
441 dev_info(&mtd->dev, "Attached to MTD device %d\n", mtd->index);
442 }
443
/*
 * Physically drop the removed records of one erase block while keeping the
 * records that are still in use.
 *
 * The block is read into a temporary buffer, erased, and then every zone
 * still marked used is written back from its own position in that buffer.
 *
 * @off is expected to be the start of an erase block and @size to be at most
 * one erase block; the only caller in this file passes exactly one block.
 *
 * Returns 0 on success, -ENOMEM when the buffer cannot be allocated, the
 * error of the read or erase when one of those fails (nothing is written
 * back then), otherwise the first write-back error encountered.
 */
static int mtdpstore_flush_removed_do(struct mtdpstore_context *cxt,
		loff_t off, size_t size)
{
	struct mtd_info *mtd = cxt->mtd;
	unsigned int zonesize = cxt->info.kmsg_size;
	struct erase_info erase = { .addr = off, .len = mtd->erasesize };
	u_char *buf, *zonebuf;
	size_t retlen;
	int ret, err;

	buf = kmalloc(mtd->erasesize, GFP_KERNEL);
	if (!buf)
		return -ENOMEM;

	/* 1st. read to cache */
	ret = mtd_read(mtd, off, mtd->erasesize, &retlen, buf);
	if (mtdpstore_is_io_error(ret))
		goto free;

	/* 2nd. erase block */
	ret = mtd_erase(mtd, &erase);
	if (ret)
		goto free;

	/* 3rd. write back */
	zonebuf = buf;
	while (size) {
		/* never run past the cached block on a trailing partial zone */
		size_t chunk = min_t(size_t, zonesize, size);

		/* there is valid data on block, write back */
		if (mtdpstore_is_used(cxt, off)) {
			/* each zone is restored from its own slice of the cache */
			err = mtd_write(mtd, off, chunk, &retlen, zonebuf);
			if (err) {
				dev_err(&mtd->dev, "write failure at %lld (%zu of %u written), err %d\n",
					off, retlen, (unsigned int)chunk, err);
				/* keep going, but remember the first failure */
				if (!ret)
					ret = err;
			}
		}

		off += chunk;
		zonebuf += chunk;
		size -= chunk;
	}

free:
	kfree(buf);
	return ret;
}
489
490 /*
491 * What does mtdpstore_flush_removed() do?
492 * When user remove any log file on pstore filesystem, mtdpstore should do
493 * something to ensure log file removed. If the whole block is no longer used,
494 * it's nice to erase the block. However if the block still contains valid log,
495 * what mtdpstore can do is to erase and write the valid log back.
496 */
mtdpstore_flush_removed(struct mtdpstore_context * cxt)497 static int mtdpstore_flush_removed(struct mtdpstore_context *cxt)
498 {
499 struct mtd_info *mtd = cxt->mtd;
500 int ret;
501 loff_t off;
502 u32 blkcnt = (u32)div_u64(mtd->size, mtd->erasesize);
503
504 for (off = 0; blkcnt > 0; blkcnt--, off += mtd->erasesize) {
505 ret = mtdpstore_block_isbad(cxt, off);
506 if (ret)
507 continue;
508
509 ret = mtdpstore_block_is_removed(cxt, off);
510 if (!ret)
511 continue;
512
513 ret = mtdpstore_flush_removed_do(cxt, off, mtd->erasesize);
514 if (ret)
515 return ret;
516 }
517 return 0;
518 }
519
mtdpstore_notify_remove(struct mtd_info * mtd)520 static void mtdpstore_notify_remove(struct mtd_info *mtd)
521 {
522 struct mtdpstore_context *cxt = &oops_cxt;
523
524 if (mtd->index != cxt->index || cxt->index < 0)
525 return;
526
527 mtdpstore_flush_removed(cxt);
528
529 unregister_pstore_device(&cxt->dev);
530 kfree(cxt->badmap);
531 kfree(cxt->usedmap);
532 kfree(cxt->rmmap);
533 cxt->mtd = NULL;
534 cxt->index = -1;
535 }
536
537 static struct mtd_notifier mtdpstore_notifier = {
538 .add = mtdpstore_notify_add,
539 .remove = mtdpstore_notify_remove,
540 };
541
mtdpstore_init(void)542 static int __init mtdpstore_init(void)
543 {
544 int ret;
545 struct mtdpstore_context *cxt = &oops_cxt;
546 struct pstore_blk_config *info = &cxt->info;
547
548 ret = pstore_blk_get_config(info);
549 if (unlikely(ret))
550 return ret;
551
552 if (strlen(info->device) == 0) {
553 pr_err("mtd device must be supplied (device name is empty)\n");
554 return -EINVAL;
555 }
556 if (!info->kmsg_size) {
557 pr_err("no backend enabled (kmsg_size is 0)\n");
558 return -EINVAL;
559 }
560
561 /* Setup the MTD device to use */
562 ret = kstrtoint((char *)info->device, 0, &cxt->index);
563 if (ret)
564 cxt->index = -1;
565
566 register_mtd_user(&mtdpstore_notifier);
567 return 0;
568 }
569 module_init(mtdpstore_init);
570
mtdpstore_exit(void)571 static void __exit mtdpstore_exit(void)
572 {
573 unregister_mtd_user(&mtdpstore_notifier);
574 }
575 module_exit(mtdpstore_exit);
576
577 MODULE_LICENSE("GPL");
578 MODULE_AUTHOR("WeiXiong Liao <liaoweixiong@allwinnertech.com>");
579 MODULE_DESCRIPTION("MTD backend for pstore/blk");
580