[platform/kernel/linux-rpi.git] fs/f2fs/compress.c (ac321e217d574661205cd6a617c591404d69cb68)
1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  * f2fs compress support
4  *
5  * Copyright (c) 2019 Chao Yu <chao@kernel.org>
6  */
7
8 #include <linux/fs.h>
9 #include <linux/f2fs_fs.h>
10 #include <linux/writeback.h>
11 #include <linux/backing-dev.h>
12 #include <linux/lzo.h>
13 #include <linux/lz4.h>
14 #include <linux/zstd.h>
15
16 #include "f2fs.h"
17 #include "node.h"
18 #include <trace/events/f2fs.h>
19
20 static struct kmem_cache *cic_entry_slab;
21 static struct kmem_cache *dic_entry_slab;
22
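/*
 * Allocate/free an array of 'nr' page pointers, using the per-sb page
 * array slab when the request fits in one slab object and falling back
 * to the generic allocator otherwise.
 */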
23 static void *page_array_alloc(struct inode *inode, int nr)
24 {
25         struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
26         unsigned int size = sizeof(struct page *) * nr;
27
28         if (likely(size <= sbi->page_array_slab_size))
29                 return kmem_cache_zalloc(sbi->page_array_slab, GFP_NOFS);
30         return f2fs_kzalloc(sbi, size, GFP_NOFS);
31 }
32
33 static void page_array_free(struct inode *inode, void *pages, int nr)
34 {
35         struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
36         unsigned int size = sizeof(struct page *) * nr;
37
38         if (!pages)
39                 return;
40
41         if (likely(size <= sbi->page_array_slab_size))
42                 kmem_cache_free(sbi->page_array_slab, pages);
43         else
44                 kfree(pages);
45 }
46
47 struct f2fs_compress_ops {
48         int (*init_compress_ctx)(struct compress_ctx *cc);
49         void (*destroy_compress_ctx)(struct compress_ctx *cc);
50         int (*compress_pages)(struct compress_ctx *cc);
51         int (*init_decompress_ctx)(struct decompress_io_ctx *dic);
52         void (*destroy_decompress_ctx)(struct decompress_io_ctx *dic);
53         int (*decompress_pages)(struct decompress_io_ctx *dic);
54 };
55
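/*
 * Helpers mapping a page index to its offset within its cluster, to the
 * index of that cluster, and to the first page index of cc's cluster.
 */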
56 static unsigned int offset_in_cluster(struct compress_ctx *cc, pgoff_t index)
57 {
58         return index & (cc->cluster_size - 1);
59 }
60
61 static pgoff_t cluster_idx(struct compress_ctx *cc, pgoff_t index)
62 {
63         return index >> cc->log_cluster_size;
64 }
65
66 static pgoff_t start_idx_of_cluster(struct compress_ctx *cc)
67 {
68         return cc->cluster_idx << cc->log_cluster_size;
69 }
70
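/*
 * A compressed (intermediate) page has its page_private pointing at a
 * compress/decompress I/O context whose first field is
 * F2FS_COMPRESSED_PAGE_MAGIC.
 */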
71 bool f2fs_is_compressed_page(struct page *page)
72 {
73         if (!PagePrivate(page))
74                 return false;
75         if (!page_private(page))
76                 return false;
77         if (IS_ATOMIC_WRITTEN_PAGE(page) || IS_DUMMY_WRITTEN_PAGE(page))
78                 return false;
79
80         f2fs_bug_on(F2FS_M_SB(page->mapping),
81                 *((u32 *)page_private(page)) != F2FS_COMPRESSED_PAGE_MAGIC);
82         return true;
83 }
84
85 static void f2fs_set_compressed_page(struct page *page,
86                 struct inode *inode, pgoff_t index, void *data)
87 {
88         SetPagePrivate(page);
89         set_page_private(page, (unsigned long)data);
90
91         /* i_crypto_info and iv index */
92         page->index = index;
93         page->mapping = inode->i_mapping;
94 }
95
96 static void f2fs_drop_rpages(struct compress_ctx *cc, int len, bool unlock)
97 {
98         int i;
99
100         for (i = 0; i < len; i++) {
101                 if (!cc->rpages[i])
102                         continue;
103                 if (unlock)
104                         unlock_page(cc->rpages[i]);
105                 else
106                         put_page(cc->rpages[i]);
107         }
108 }
109
110 static void f2fs_put_rpages(struct compress_ctx *cc)
111 {
112         f2fs_drop_rpages(cc, cc->cluster_size, false);
113 }
114
115 static void f2fs_unlock_rpages(struct compress_ctx *cc, int len)
116 {
117         f2fs_drop_rpages(cc, len, true);
118 }
119
120 static void f2fs_put_rpages_wbc(struct compress_ctx *cc,
121                 struct writeback_control *wbc, bool redirty, int unlock)
122 {
123         unsigned int i;
124
125         for (i = 0; i < cc->cluster_size; i++) {
126                 if (!cc->rpages[i])
127                         continue;
128                 if (redirty)
129                         redirty_page_for_writepage(wbc, cc->rpages[i]);
130                 f2fs_put_page(cc->rpages[i], unlock);
131         }
132 }
133
134 struct page *f2fs_compress_control_page(struct page *page)
135 {
136         return ((struct compress_io_ctx *)page_private(page))->rpages[0];
137 }
138
139 int f2fs_init_compress_ctx(struct compress_ctx *cc)
140 {
141         if (cc->rpages)
142                 return 0;
143
144         cc->rpages = page_array_alloc(cc->inode, cc->cluster_size);
145         return cc->rpages ? 0 : -ENOMEM;
146 }
147
148 void f2fs_destroy_compress_ctx(struct compress_ctx *cc, bool reuse)
149 {
150         page_array_free(cc->inode, cc->rpages, cc->cluster_size);
151         cc->rpages = NULL;
152         cc->nr_rpages = 0;
153         cc->nr_cpages = 0;
154         if (!reuse)
155                 cc->cluster_idx = NULL_CLUSTER;
156 }
157
158 void f2fs_compress_ctx_add_page(struct compress_ctx *cc, struct page *page)
159 {
160         unsigned int cluster_ofs;
161
162         if (!f2fs_cluster_can_merge_page(cc, page->index))
163                 f2fs_bug_on(F2FS_I_SB(cc->inode), 1);
164
165         cluster_ofs = offset_in_cluster(cc, page->index);
166         cc->rpages[cluster_ofs] = page;
167         cc->nr_rpages++;
168         cc->cluster_idx = cluster_idx(cc, page->index);
169 }
170
171 #ifdef CONFIG_F2FS_FS_LZO
172 static int lzo_init_compress_ctx(struct compress_ctx *cc)
173 {
174         cc->private = f2fs_kvmalloc(F2FS_I_SB(cc->inode),
175                                 LZO1X_MEM_COMPRESS, GFP_NOFS);
176         if (!cc->private)
177                 return -ENOMEM;
178
179         cc->clen = lzo1x_worst_compress(PAGE_SIZE << cc->log_cluster_size);
180         return 0;
181 }
182
183 static void lzo_destroy_compress_ctx(struct compress_ctx *cc)
184 {
185         kvfree(cc->private);
186         cc->private = NULL;
187 }
188
189 static int lzo_compress_pages(struct compress_ctx *cc)
190 {
191         int ret;
192
193         ret = lzo1x_1_compress(cc->rbuf, cc->rlen, cc->cbuf->cdata,
194                                         &cc->clen, cc->private);
195         if (ret != LZO_E_OK) {
196                 printk_ratelimited("%sF2FS-fs (%s): lzo compress failed, ret:%d\n",
197                                 KERN_ERR, F2FS_I_SB(cc->inode)->sb->s_id, ret);
198                 return -EIO;
199         }
200         return 0;
201 }
202
203 static int lzo_decompress_pages(struct decompress_io_ctx *dic)
204 {
205         int ret;
206
207         ret = lzo1x_decompress_safe(dic->cbuf->cdata, dic->clen,
208                                                 dic->rbuf, &dic->rlen);
209         if (ret != LZO_E_OK) {
210                 printk_ratelimited("%sF2FS-fs (%s): lzo decompress failed, ret:%d\n",
211                                 KERN_ERR, F2FS_I_SB(dic->inode)->sb->s_id, ret);
212                 return -EIO;
213         }
214
215         if (dic->rlen != PAGE_SIZE << dic->log_cluster_size) {
216                 printk_ratelimited("%sF2FS-fs (%s): lzo invalid rlen:%zu, "
217                                         "expected:%lu\n", KERN_ERR,
218                                         F2FS_I_SB(dic->inode)->sb->s_id,
219                                         dic->rlen,
220                                         PAGE_SIZE << dic->log_cluster_size);
221                 return -EIO;
222         }
223         return 0;
224 }
225
226 static const struct f2fs_compress_ops f2fs_lzo_ops = {
227         .init_compress_ctx      = lzo_init_compress_ctx,
228         .destroy_compress_ctx   = lzo_destroy_compress_ctx,
229         .compress_pages         = lzo_compress_pages,
230         .decompress_pages       = lzo_decompress_pages,
231 };
232 #endif
233
234 #ifdef CONFIG_F2FS_FS_LZ4
235 static int lz4_init_compress_ctx(struct compress_ctx *cc)
236 {
237         unsigned int size = LZ4_MEM_COMPRESS;
238
239 #ifdef CONFIG_F2FS_FS_LZ4HC
240         if (F2FS_I(cc->inode)->i_compress_flag >> COMPRESS_LEVEL_OFFSET)
241                 size = LZ4HC_MEM_COMPRESS;
242 #endif
243
244         cc->private = f2fs_kvmalloc(F2FS_I_SB(cc->inode), size, GFP_NOFS);
245         if (!cc->private)
246                 return -ENOMEM;
247
248         /*
249          * We do not set cc->clen to LZ4_compressBound(inputsize) to cover the
250          * worst compress case, because the lz4 compressor handles the output
251          * budget properly and fails if the destination buffer is too small.
252          */
253         cc->clen = cc->rlen - PAGE_SIZE - COMPRESS_HEADER_SIZE;
254         return 0;
255 }
256
257 static void lz4_destroy_compress_ctx(struct compress_ctx *cc)
258 {
259         kvfree(cc->private);
260         cc->private = NULL;
261 }
262
263 #ifdef CONFIG_F2FS_FS_LZ4HC
264 static int lz4hc_compress_pages(struct compress_ctx *cc)
265 {
266         unsigned char level = F2FS_I(cc->inode)->i_compress_flag >>
267                                                 COMPRESS_LEVEL_OFFSET;
268         int len;
269
270         if (level)
271                 len = LZ4_compress_HC(cc->rbuf, cc->cbuf->cdata, cc->rlen,
272                                         cc->clen, level, cc->private);
273         else
274                 len = LZ4_compress_default(cc->rbuf, cc->cbuf->cdata, cc->rlen,
275                                                 cc->clen, cc->private);
276         if (!len)
277                 return -EAGAIN;
278
279         cc->clen = len;
280         return 0;
281 }
282 #endif
283
284 static int lz4_compress_pages(struct compress_ctx *cc)
285 {
286         int len;
287
288 #ifdef CONFIG_F2FS_FS_LZ4HC
289         return lz4hc_compress_pages(cc);
290 #endif
291         len = LZ4_compress_default(cc->rbuf, cc->cbuf->cdata, cc->rlen,
292                                                 cc->clen, cc->private);
293         if (!len)
294                 return -EAGAIN;
295
296         cc->clen = len;
297         return 0;
298 }
299
300 static int lz4_decompress_pages(struct decompress_io_ctx *dic)
301 {
302         int ret;
303
304         ret = LZ4_decompress_safe(dic->cbuf->cdata, dic->rbuf,
305                                                 dic->clen, dic->rlen);
306         if (ret < 0) {
307                 printk_ratelimited("%sF2FS-fs (%s): lz4 decompress failed, ret:%d\n",
308                                 KERN_ERR, F2FS_I_SB(dic->inode)->sb->s_id, ret);
309                 return -EIO;
310         }
311
312         if (ret != PAGE_SIZE << dic->log_cluster_size) {
313                 printk_ratelimited("%sF2FS-fs (%s): lz4 invalid rlen:%zu, "
314                                         "expected:%lu\n", KERN_ERR,
315                                         F2FS_I_SB(dic->inode)->sb->s_id,
316                                         dic->rlen,
317                                         PAGE_SIZE << dic->log_cluster_size);
318                 return -EIO;
319         }
320         return 0;
321 }
322
323 static const struct f2fs_compress_ops f2fs_lz4_ops = {
324         .init_compress_ctx      = lz4_init_compress_ctx,
325         .destroy_compress_ctx   = lz4_destroy_compress_ctx,
326         .compress_pages         = lz4_compress_pages,
327         .decompress_pages       = lz4_decompress_pages,
328 };
329 #endif
330
331 #ifdef CONFIG_F2FS_FS_ZSTD
332 #define F2FS_ZSTD_DEFAULT_CLEVEL        1
333
334 static int zstd_init_compress_ctx(struct compress_ctx *cc)
335 {
336         ZSTD_parameters params;
337         ZSTD_CStream *stream;
338         void *workspace;
339         unsigned int workspace_size;
340         unsigned char level = F2FS_I(cc->inode)->i_compress_flag >>
341                                                 COMPRESS_LEVEL_OFFSET;
342
343         if (!level)
344                 level = F2FS_ZSTD_DEFAULT_CLEVEL;
345
346         params = ZSTD_getParams(level, cc->rlen, 0);
347         workspace_size = ZSTD_CStreamWorkspaceBound(params.cParams);
348
349         workspace = f2fs_kvmalloc(F2FS_I_SB(cc->inode),
350                                         workspace_size, GFP_NOFS);
351         if (!workspace)
352                 return -ENOMEM;
353
354         stream = ZSTD_initCStream(params, 0, workspace, workspace_size);
355         if (!stream) {
356                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD_initCStream failed\n",
357                                 KERN_ERR, F2FS_I_SB(cc->inode)->sb->s_id,
358                                 __func__);
359                 kvfree(workspace);
360                 return -EIO;
361         }
362
363         cc->private = workspace;
364         cc->private2 = stream;
365
366         cc->clen = cc->rlen - PAGE_SIZE - COMPRESS_HEADER_SIZE;
367         return 0;
368 }
369
370 static void zstd_destroy_compress_ctx(struct compress_ctx *cc)
371 {
372         kvfree(cc->private);
373         cc->private = NULL;
374         cc->private2 = NULL;
375 }
376
377 static int zstd_compress_pages(struct compress_ctx *cc)
378 {
379         ZSTD_CStream *stream = cc->private2;
380         ZSTD_inBuffer inbuf;
381         ZSTD_outBuffer outbuf;
382         int src_size = cc->rlen;
383         int dst_size = src_size - PAGE_SIZE - COMPRESS_HEADER_SIZE;
384         int ret;
385
386         inbuf.pos = 0;
387         inbuf.src = cc->rbuf;
388         inbuf.size = src_size;
389
390         outbuf.pos = 0;
391         outbuf.dst = cc->cbuf->cdata;
392         outbuf.size = dst_size;
393
394         ret = ZSTD_compressStream(stream, &outbuf, &inbuf);
395         if (ZSTD_isError(ret)) {
396                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD_compressStream failed, ret: %d\n",
397                                 KERN_ERR, F2FS_I_SB(cc->inode)->sb->s_id,
398                                 __func__, ZSTD_getErrorCode(ret));
399                 return -EIO;
400         }
401
402         ret = ZSTD_endStream(stream, &outbuf);
403         if (ZSTD_isError(ret)) {
404                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD_endStream returned %d\n",
405                                 KERN_ERR, F2FS_I_SB(cc->inode)->sb->s_id,
406                                 __func__, ZSTD_getErrorCode(ret));
407                 return -EIO;
408         }
409
410         /*
411          * Compressed data remains in the intermediate buffer because there is
412          * no more space left in cbuf->cdata.
413          */
414         if (ret)
415                 return -EAGAIN;
416
417         cc->clen = outbuf.pos;
418         return 0;
419 }
420
421 static int zstd_init_decompress_ctx(struct decompress_io_ctx *dic)
422 {
423         ZSTD_DStream *stream;
424         void *workspace;
425         unsigned int workspace_size;
426         unsigned int max_window_size =
427                         MAX_COMPRESS_WINDOW_SIZE(dic->log_cluster_size);
428
429         workspace_size = ZSTD_DStreamWorkspaceBound(max_window_size);
430
431         workspace = f2fs_kvmalloc(F2FS_I_SB(dic->inode),
432                                         workspace_size, GFP_NOFS);
433         if (!workspace)
434                 return -ENOMEM;
435
436         stream = ZSTD_initDStream(max_window_size, workspace, workspace_size);
437         if (!stream) {
438                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD_initDStream failed\n",
439                                 KERN_ERR, F2FS_I_SB(dic->inode)->sb->s_id,
440                                 __func__);
441                 kvfree(workspace);
442                 return -EIO;
443         }
444
445         dic->private = workspace;
446         dic->private2 = stream;
447
448         return 0;
449 }
450
451 static void zstd_destroy_decompress_ctx(struct decompress_io_ctx *dic)
452 {
453         kvfree(dic->private);
454         dic->private = NULL;
455         dic->private2 = NULL;
456 }
457
458 static int zstd_decompress_pages(struct decompress_io_ctx *dic)
459 {
460         ZSTD_DStream *stream = dic->private2;
461         ZSTD_inBuffer inbuf;
462         ZSTD_outBuffer outbuf;
463         int ret;
464
465         inbuf.pos = 0;
466         inbuf.src = dic->cbuf->cdata;
467         inbuf.size = dic->clen;
468
469         outbuf.pos = 0;
470         outbuf.dst = dic->rbuf;
471         outbuf.size = dic->rlen;
472
473         ret = ZSTD_decompressStream(stream, &outbuf, &inbuf);
474         if (ZSTD_isError(ret)) {
475                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD_decompressStream failed, ret: %d\n",
476                                 KERN_ERR, F2FS_I_SB(dic->inode)->sb->s_id,
477                                 __func__, ZSTD_getErrorCode(ret));
478                 return -EIO;
479         }
480
481         if (dic->rlen != outbuf.pos) {
482                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD invalid rlen:%zu, "
483                                 "expected:%lu\n", KERN_ERR,
484                                 F2FS_I_SB(dic->inode)->sb->s_id,
485                                 __func__, dic->rlen,
486                                 PAGE_SIZE << dic->log_cluster_size);
487                 return -EIO;
488         }
489
490         return 0;
491 }
492
493 static const struct f2fs_compress_ops f2fs_zstd_ops = {
494         .init_compress_ctx      = zstd_init_compress_ctx,
495         .destroy_compress_ctx   = zstd_destroy_compress_ctx,
496         .compress_pages         = zstd_compress_pages,
497         .init_decompress_ctx    = zstd_init_decompress_ctx,
498         .destroy_decompress_ctx = zstd_destroy_decompress_ctx,
499         .decompress_pages       = zstd_decompress_pages,
500 };
501 #endif
502
503 #ifdef CONFIG_F2FS_FS_LZO
504 #ifdef CONFIG_F2FS_FS_LZORLE
505 static int lzorle_compress_pages(struct compress_ctx *cc)
506 {
507         int ret;
508
509         ret = lzorle1x_1_compress(cc->rbuf, cc->rlen, cc->cbuf->cdata,
510                                         &cc->clen, cc->private);
511         if (ret != LZO_E_OK) {
512                 printk_ratelimited("%sF2FS-fs (%s): lzo-rle compress failed, ret:%d\n",
513                                 KERN_ERR, F2FS_I_SB(cc->inode)->sb->s_id, ret);
514                 return -EIO;
515         }
516         return 0;
517 }
518
519 static const struct f2fs_compress_ops f2fs_lzorle_ops = {
520         .init_compress_ctx      = lzo_init_compress_ctx,
521         .destroy_compress_ctx   = lzo_destroy_compress_ctx,
522         .compress_pages         = lzorle_compress_pages,
523         .decompress_pages       = lzo_decompress_pages,
524 };
525 #endif
526 #endif
527
528 static const struct f2fs_compress_ops *f2fs_cops[COMPRESS_MAX] = {
529 #ifdef CONFIG_F2FS_FS_LZO
530         &f2fs_lzo_ops,
531 #else
532         NULL,
533 #endif
534 #ifdef CONFIG_F2FS_FS_LZ4
535         &f2fs_lz4_ops,
536 #else
537         NULL,
538 #endif
539 #ifdef CONFIG_F2FS_FS_ZSTD
540         &f2fs_zstd_ops,
541 #else
542         NULL,
543 #endif
544 #if defined(CONFIG_F2FS_FS_LZO) && defined(CONFIG_F2FS_FS_LZORLE)
545         &f2fs_lzorle_ops,
546 #else
547         NULL,
548 #endif
549 };
550
551 bool f2fs_is_compress_backend_ready(struct inode *inode)
552 {
553         if (!f2fs_compressed_file(inode))
554                 return true;
555         return f2fs_cops[F2FS_I(inode)->i_compress_algorithm];
556 }
557
558 static mempool_t *compress_page_pool;
559 static int num_compress_pages = 512;
560 module_param(num_compress_pages, uint, 0444);
561 MODULE_PARM_DESC(num_compress_pages,
562                 "Number of intermediate compress pages to preallocate");
563
564 int f2fs_init_compress_mempool(void)
565 {
566         compress_page_pool = mempool_create_page_pool(num_compress_pages, 0);
567         if (!compress_page_pool)
568                 return -ENOMEM;
569
570         return 0;
571 }
572
573 void f2fs_destroy_compress_mempool(void)
574 {
575         mempool_destroy(compress_page_pool);
576 }
577
578 static struct page *f2fs_compress_alloc_page(void)
579 {
580         struct page *page;
581
582         page = mempool_alloc(compress_page_pool, GFP_NOFS);
583         lock_page(page);
584
585         return page;
586 }
587
588 static void f2fs_compress_free_page(struct page *page)
589 {
590         if (!page)
591                 return;
592         set_page_private(page, (unsigned long)NULL);
593         ClearPagePrivate(page);
594         page->mapping = NULL;
595         unlock_page(page);
596         mempool_free(page, compress_page_pool);
597 }
598
599 #define MAX_VMAP_RETRIES        3
600
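/*
 * Map an array of pages into a contiguous kernel virtual range, retrying a
 * few times after flushing stale vmap aliases if address space is tight.
 */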
601 static void *f2fs_vmap(struct page **pages, unsigned int count)
602 {
603         int i;
604         void *buf = NULL;
605
606         for (i = 0; i < MAX_VMAP_RETRIES; i++) {
607                 buf = vm_map_ram(pages, count, -1);
608                 if (buf)
609                         break;
610                 vm_unmap_aliases();
611         }
612         return buf;
613 }
614
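/*
 * Compress the raw pages of one cluster (cc->rpages) into newly allocated
 * intermediate pages (cc->cpages).  On success cc->clen holds the payload
 * length and cc->nr_cpages is trimmed to the pages actually needed;
 * -EAGAIN means the cluster did not compress well enough to save a block
 * and should be written uncompressed.
 */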
615 static int f2fs_compress_pages(struct compress_ctx *cc)
616 {
617         struct f2fs_inode_info *fi = F2FS_I(cc->inode);
618         const struct f2fs_compress_ops *cops =
619                                 f2fs_cops[fi->i_compress_algorithm];
620         unsigned int max_len, new_nr_cpages;
621         struct page **new_cpages;
622         u32 chksum = 0;
623         int i, ret;
624
625         trace_f2fs_compress_pages_start(cc->inode, cc->cluster_idx,
626                                 cc->cluster_size, fi->i_compress_algorithm);
627
628         if (cops->init_compress_ctx) {
629                 ret = cops->init_compress_ctx(cc);
630                 if (ret)
631                         goto out;
632         }
633
634         max_len = COMPRESS_HEADER_SIZE + cc->clen;
635         cc->nr_cpages = DIV_ROUND_UP(max_len, PAGE_SIZE);
636
637         cc->cpages = page_array_alloc(cc->inode, cc->nr_cpages);
638         if (!cc->cpages) {
639                 ret = -ENOMEM;
640                 goto destroy_compress_ctx;
641         }
642
643         for (i = 0; i < cc->nr_cpages; i++) {
644                 cc->cpages[i] = f2fs_compress_alloc_page();
645                 if (!cc->cpages[i]) {
646                         ret = -ENOMEM;
647                         goto out_free_cpages;
648                 }
649         }
650
651         cc->rbuf = f2fs_vmap(cc->rpages, cc->cluster_size);
652         if (!cc->rbuf) {
653                 ret = -ENOMEM;
654                 goto out_free_cpages;
655         }
656
657         cc->cbuf = f2fs_vmap(cc->cpages, cc->nr_cpages);
658         if (!cc->cbuf) {
659                 ret = -ENOMEM;
660                 goto out_vunmap_rbuf;
661         }
662
663         ret = cops->compress_pages(cc);
664         if (ret)
665                 goto out_vunmap_cbuf;
666
667         max_len = PAGE_SIZE * (cc->cluster_size - 1) - COMPRESS_HEADER_SIZE;
668
669         if (cc->clen > max_len) {
670                 ret = -EAGAIN;
671                 goto out_vunmap_cbuf;
672         }
673
674         cc->cbuf->clen = cpu_to_le32(cc->clen);
675
676         if (fi->i_compress_flag & 1 << COMPRESS_CHKSUM)
677                 chksum = f2fs_crc32(F2FS_I_SB(cc->inode),
678                                         cc->cbuf->cdata, cc->clen);
679         cc->cbuf->chksum = cpu_to_le32(chksum);
680
681         for (i = 0; i < COMPRESS_DATA_RESERVED_SIZE; i++)
682                 cc->cbuf->reserved[i] = cpu_to_le32(0);
683
684         new_nr_cpages = DIV_ROUND_UP(cc->clen + COMPRESS_HEADER_SIZE, PAGE_SIZE);
685
686         /* Now we're going to cut unnecessary tail pages */
687         new_cpages = page_array_alloc(cc->inode, new_nr_cpages);
688         if (!new_cpages) {
689                 ret = -ENOMEM;
690                 goto out_vunmap_cbuf;
691         }
692
693         /* zero out any unused part of the last page */
694         memset(&cc->cbuf->cdata[cc->clen], 0,
695                         (new_nr_cpages * PAGE_SIZE) -
696                         (cc->clen + COMPRESS_HEADER_SIZE));
697
698         vm_unmap_ram(cc->cbuf, cc->nr_cpages);
699         vm_unmap_ram(cc->rbuf, cc->cluster_size);
700
701         for (i = 0; i < cc->nr_cpages; i++) {
702                 if (i < new_nr_cpages) {
703                         new_cpages[i] = cc->cpages[i];
704                         continue;
705                 }
706                 f2fs_compress_free_page(cc->cpages[i]);
707                 cc->cpages[i] = NULL;
708         }
709
710         if (cops->destroy_compress_ctx)
711                 cops->destroy_compress_ctx(cc);
712
713         page_array_free(cc->inode, cc->cpages, cc->nr_cpages);
714         cc->cpages = new_cpages;
715         cc->nr_cpages = new_nr_cpages;
716
717         trace_f2fs_compress_pages_end(cc->inode, cc->cluster_idx,
718                                                         cc->clen, ret);
719         return 0;
720
721 out_vunmap_cbuf:
722         vm_unmap_ram(cc->cbuf, cc->nr_cpages);
723 out_vunmap_rbuf:
724         vm_unmap_ram(cc->rbuf, cc->cluster_size);
725 out_free_cpages:
726         for (i = 0; i < cc->nr_cpages; i++) {
727                 if (cc->cpages[i])
728                         f2fs_compress_free_page(cc->cpages[i]);
729         }
730         page_array_free(cc->inode, cc->cpages, cc->nr_cpages);
731         cc->cpages = NULL;
732 destroy_compress_ctx:
733         if (cops->destroy_compress_ctx)
734                 cops->destroy_compress_ctx(cc);
735 out:
736         trace_f2fs_compress_pages_end(cc->inode, cc->cluster_idx,
737                                                         cc->clen, ret);
738         return ret;
739 }
740
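/*
 * Decompress one cluster: map the compressed pages and the target pages,
 * run the per-algorithm decompressor, optionally verify the cluster
 * checksum, and finally complete the read via f2fs_decompress_end_io().
 */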
741 static void f2fs_decompress_cluster(struct decompress_io_ctx *dic)
742 {
743         struct f2fs_sb_info *sbi = F2FS_I_SB(dic->inode);
744         struct f2fs_inode_info *fi = F2FS_I(dic->inode);
745         const struct f2fs_compress_ops *cops =
746                         f2fs_cops[fi->i_compress_algorithm];
747         int ret;
748         int i;
749
750         trace_f2fs_decompress_pages_start(dic->inode, dic->cluster_idx,
751                                 dic->cluster_size, fi->i_compress_algorithm);
752
753         if (dic->failed) {
754                 ret = -EIO;
755                 goto out_end_io;
756         }
757
758         dic->tpages = page_array_alloc(dic->inode, dic->cluster_size);
759         if (!dic->tpages) {
760                 ret = -ENOMEM;
761                 goto out_end_io;
762         }
763
764         for (i = 0; i < dic->cluster_size; i++) {
765                 if (dic->rpages[i]) {
766                         dic->tpages[i] = dic->rpages[i];
767                         continue;
768                 }
769
770                 dic->tpages[i] = f2fs_compress_alloc_page();
771                 if (!dic->tpages[i]) {
772                         ret = -ENOMEM;
773                         goto out_end_io;
774                 }
775         }
776
777         if (cops->init_decompress_ctx) {
778                 ret = cops->init_decompress_ctx(dic);
779                 if (ret)
780                         goto out_end_io;
781         }
782
783         dic->rbuf = f2fs_vmap(dic->tpages, dic->cluster_size);
784         if (!dic->rbuf) {
785                 ret = -ENOMEM;
786                 goto out_destroy_decompress_ctx;
787         }
788
789         dic->cbuf = f2fs_vmap(dic->cpages, dic->nr_cpages);
790         if (!dic->cbuf) {
791                 ret = -ENOMEM;
792                 goto out_vunmap_rbuf;
793         }
794
795         dic->clen = le32_to_cpu(dic->cbuf->clen);
796         dic->rlen = PAGE_SIZE << dic->log_cluster_size;
797
798         if (dic->clen > PAGE_SIZE * dic->nr_cpages - COMPRESS_HEADER_SIZE) {
799                 ret = -EFSCORRUPTED;
800                 goto out_vunmap_cbuf;
801         }
802
803         ret = cops->decompress_pages(dic);
804
805         if (!ret && (fi->i_compress_flag & 1 << COMPRESS_CHKSUM)) {
806                 u32 provided = le32_to_cpu(dic->cbuf->chksum);
807                 u32 calculated = f2fs_crc32(sbi, dic->cbuf->cdata, dic->clen);
808
809                 if (provided != calculated) {
810                         if (!is_inode_flag_set(dic->inode, FI_COMPRESS_CORRUPT)) {
811                                 set_inode_flag(dic->inode, FI_COMPRESS_CORRUPT);
812                                 printk_ratelimited(
813                                         "%sF2FS-fs (%s): checksum invalid, nid = %lu, %x vs %x",
814                                         KERN_INFO, sbi->sb->s_id, dic->inode->i_ino,
815                                         provided, calculated);
816                         }
817                         set_sbi_flag(sbi, SBI_NEED_FSCK);
818                 }
819         }
820
821 out_vunmap_cbuf:
822         vm_unmap_ram(dic->cbuf, dic->nr_cpages);
823 out_vunmap_rbuf:
824         vm_unmap_ram(dic->rbuf, dic->cluster_size);
825 out_destroy_decompress_ctx:
826         if (cops->destroy_decompress_ctx)
827                 cops->destroy_decompress_ctx(dic);
828 out_end_io:
829         trace_f2fs_decompress_pages_end(dic->inode, dic->cluster_idx,
830                                                         dic->clen, ret);
831         f2fs_decompress_end_io(dic, ret);
832 }
833
834 /*
835  * This is called when a page of a compressed cluster has been read from disk
836  * (or failed to be read from disk).  It checks whether this page was the last
837  * page being waited on in the cluster, and if so, it decompresses the cluster
838  * (or in the case of a failure, cleans up without actually decompressing).
839  */
840 void f2fs_end_read_compressed_page(struct page *page, bool failed)
841 {
842         struct decompress_io_ctx *dic =
843                         (struct decompress_io_ctx *)page_private(page);
844         struct f2fs_sb_info *sbi = F2FS_I_SB(dic->inode);
845
846         dec_page_count(sbi, F2FS_RD_DATA);
847
848         if (failed)
849                 WRITE_ONCE(dic->failed, true);
850
851         if (atomic_dec_and_test(&dic->remaining_pages))
852                 f2fs_decompress_cluster(dic);
853 }
854
855 static bool is_page_in_cluster(struct compress_ctx *cc, pgoff_t index)
856 {
857         if (cc->cluster_idx == NULL_CLUSTER)
858                 return true;
859         return cc->cluster_idx == cluster_idx(cc, index);
860 }
861
862 bool f2fs_cluster_is_empty(struct compress_ctx *cc)
863 {
864         return cc->nr_rpages == 0;
865 }
866
867 static bool f2fs_cluster_is_full(struct compress_ctx *cc)
868 {
869         return cc->cluster_size == cc->nr_rpages;
870 }
871
872 bool f2fs_cluster_can_merge_page(struct compress_ctx *cc, pgoff_t index)
873 {
874         if (f2fs_cluster_is_empty(cc))
875                 return true;
876         return is_page_in_cluster(cc, index);
877 }
878
879 static bool cluster_has_invalid_data(struct compress_ctx *cc)
880 {
881         loff_t i_size = i_size_read(cc->inode);
882         unsigned nr_pages = DIV_ROUND_UP(i_size, PAGE_SIZE);
883         int i;
884
885         for (i = 0; i < cc->cluster_size; i++) {
886                 struct page *page = cc->rpages[i];
887
888                 f2fs_bug_on(F2FS_I_SB(cc->inode), !page);
889
890                 /* beyond EOF */
891                 if (page->index >= nr_pages)
892                         return true;
893         }
894         return false;
895 }
896
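/*
 * Count blocks in one cluster.  Returns 0 for a non-compressed cluster (or
 * a missing dnode), a negative errno on error, and otherwise 1 for the
 * COMPRESS_ADDR header plus the number of compressed blocks (@compr) or of
 * non-hole blocks (!@compr).
 */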
897 static int __f2fs_cluster_blocks(struct compress_ctx *cc, bool compr)
898 {
899         struct dnode_of_data dn;
900         int ret;
901
902         set_new_dnode(&dn, cc->inode, NULL, NULL, 0);
903         ret = f2fs_get_dnode_of_data(&dn, start_idx_of_cluster(cc),
904                                                         LOOKUP_NODE);
905         if (ret) {
906                 if (ret == -ENOENT)
907                         ret = 0;
908                 goto fail;
909         }
910
911         if (dn.data_blkaddr == COMPRESS_ADDR) {
912                 int i;
913
914                 ret = 1;
915                 for (i = 1; i < cc->cluster_size; i++) {
916                         block_t blkaddr;
917
918                         blkaddr = data_blkaddr(dn.inode,
919                                         dn.node_page, dn.ofs_in_node + i);
920                         if (compr) {
921                                 if (__is_valid_data_blkaddr(blkaddr))
922                                         ret++;
923                         } else {
924                                 if (blkaddr != NULL_ADDR)
925                                         ret++;
926                         }
927                 }
928         }
929 fail:
930         f2fs_put_dnode(&dn);
931         return ret;
932 }
933
934 /* return # of compressed blocks in compressed cluster */
935 static int f2fs_compressed_blocks(struct compress_ctx *cc)
936 {
937         return __f2fs_cluster_blocks(cc, true);
938 }
939
940 /* return # of valid blocks in compressed cluster */
941 static int f2fs_cluster_blocks(struct compress_ctx *cc)
942 {
943         return __f2fs_cluster_blocks(cc, false);
944 }
945
946 int f2fs_is_compressed_cluster(struct inode *inode, pgoff_t index)
947 {
948         struct compress_ctx cc = {
949                 .inode = inode,
950                 .log_cluster_size = F2FS_I(inode)->i_log_cluster_size,
951                 .cluster_size = F2FS_I(inode)->i_cluster_size,
952                 .cluster_idx = index >> F2FS_I(inode)->i_log_cluster_size,
953         };
954
955         return f2fs_cluster_blocks(&cc);
956 }
957
958 static bool cluster_may_compress(struct compress_ctx *cc)
959 {
960         if (!f2fs_need_compress_data(cc->inode))
961                 return false;
962         if (f2fs_is_atomic_file(cc->inode))
963                 return false;
964         if (f2fs_is_mmap_file(cc->inode))
965                 return false;
966         if (!f2fs_cluster_is_full(cc))
967                 return false;
968         if (unlikely(f2fs_cp_error(F2FS_I_SB(cc->inode))))
969                 return false;
970         return !cluster_has_invalid_data(cc);
971 }
972
973 static void set_cluster_writeback(struct compress_ctx *cc)
974 {
975         int i;
976
977         for (i = 0; i < cc->cluster_size; i++) {
978                 if (cc->rpages[i])
979                         set_page_writeback(cc->rpages[i]);
980         }
981 }
982
983 static void set_cluster_dirty(struct compress_ctx *cc)
984 {
985         int i;
986
987         for (i = 0; i < cc->cluster_size; i++)
988                 if (cc->rpages[i])
989                         set_page_dirty(cc->rpages[i]);
990 }
991
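/*
 * Prepare an overwrite of a compressed cluster: grab and lock every page of
 * the cluster, read in the existing data so all pages are up to date, and
 * reserve blocks when the cluster is only partially mapped.  Returns the
 * cluster size on success, 0 if the cluster is not compressed, or a
 * negative errno.
 */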
992 static int prepare_compress_overwrite(struct compress_ctx *cc,
993                 struct page **pagep, pgoff_t index, void **fsdata)
994 {
995         struct f2fs_sb_info *sbi = F2FS_I_SB(cc->inode);
996         struct address_space *mapping = cc->inode->i_mapping;
997         struct page *page;
998         struct dnode_of_data dn;
999         sector_t last_block_in_bio;
1000         unsigned fgp_flag = FGP_LOCK | FGP_WRITE | FGP_CREAT;
1001         pgoff_t start_idx = start_idx_of_cluster(cc);
1002         int i, ret;
1003         bool prealloc;
1004
1005 retry:
1006         ret = f2fs_cluster_blocks(cc);
1007         if (ret <= 0)
1008                 return ret;
1009
1010         /* compressed case */
1011         prealloc = (ret < cc->cluster_size);
1012
1013         ret = f2fs_init_compress_ctx(cc);
1014         if (ret)
1015                 return ret;
1016
1017         /* keep page reference to avoid page reclaim */
1018         for (i = 0; i < cc->cluster_size; i++) {
1019                 page = f2fs_pagecache_get_page(mapping, start_idx + i,
1020                                                         fgp_flag, GFP_NOFS);
1021                 if (!page) {
1022                         ret = -ENOMEM;
1023                         goto unlock_pages;
1024                 }
1025
1026                 if (PageUptodate(page))
1027                         f2fs_put_page(page, 1);
1028                 else
1029                         f2fs_compress_ctx_add_page(cc, page);
1030         }
1031
1032         if (!f2fs_cluster_is_empty(cc)) {
1033                 struct bio *bio = NULL;
1034
1035                 ret = f2fs_read_multi_pages(cc, &bio, cc->cluster_size,
1036                                         &last_block_in_bio, false, true);
1037                 f2fs_put_rpages(cc);
1038                 f2fs_destroy_compress_ctx(cc, true);
1039                 if (ret)
1040                         goto out;
1041                 if (bio)
1042                         f2fs_submit_bio(sbi, bio, DATA);
1043
1044                 ret = f2fs_init_compress_ctx(cc);
1045                 if (ret)
1046                         goto out;
1047         }
1048
1049         for (i = 0; i < cc->cluster_size; i++) {
1050                 f2fs_bug_on(sbi, cc->rpages[i]);
1051
1052                 page = find_lock_page(mapping, start_idx + i);
1053                 if (!page) {
1054                         /* page can be truncated */
1055                         goto release_and_retry;
1056                 }
1057
1058                 f2fs_wait_on_page_writeback(page, DATA, true, true);
1059                 f2fs_compress_ctx_add_page(cc, page);
1060
1061                 if (!PageUptodate(page)) {
1062 release_and_retry:
1063                         f2fs_put_rpages(cc);
1064                         f2fs_unlock_rpages(cc, i + 1);
1065                         f2fs_destroy_compress_ctx(cc, true);
1066                         goto retry;
1067                 }
1068         }
1069
1070         if (prealloc) {
1071                 f2fs_do_map_lock(sbi, F2FS_GET_BLOCK_PRE_AIO, true);
1072
1073                 set_new_dnode(&dn, cc->inode, NULL, NULL, 0);
1074
1075                 for (i = cc->cluster_size - 1; i > 0; i--) {
1076                         ret = f2fs_get_block(&dn, start_idx + i);
1077                         if (ret) {
1078                                 i = cc->cluster_size;
1079                                 break;
1080                         }
1081
1082                         if (dn.data_blkaddr != NEW_ADDR)
1083                                 break;
1084                 }
1085
1086                 f2fs_do_map_lock(sbi, F2FS_GET_BLOCK_PRE_AIO, false);
1087         }
1088
1089         if (likely(!ret)) {
1090                 *fsdata = cc->rpages;
1091                 *pagep = cc->rpages[offset_in_cluster(cc, index)];
1092                 return cc->cluster_size;
1093         }
1094
1095 unlock_pages:
1096         f2fs_put_rpages(cc);
1097         f2fs_unlock_rpages(cc, i);
1098         f2fs_destroy_compress_ctx(cc, true);
1099 out:
1100         return ret;
1101 }
1102
1103 int f2fs_prepare_compress_overwrite(struct inode *inode,
1104                 struct page **pagep, pgoff_t index, void **fsdata)
1105 {
1106         struct compress_ctx cc = {
1107                 .inode = inode,
1108                 .log_cluster_size = F2FS_I(inode)->i_log_cluster_size,
1109                 .cluster_size = F2FS_I(inode)->i_cluster_size,
1110                 .cluster_idx = index >> F2FS_I(inode)->i_log_cluster_size,
1111                 .rpages = NULL,
1112                 .nr_rpages = 0,
1113         };
1114
1115         return prepare_compress_overwrite(&cc, pagep, index, fsdata);
1116 }
1117
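/*
 * Counterpart of f2fs_prepare_compress_overwrite(): dirty the cluster pages
 * if data was copied, then unlock and release them.  Returns true if @index
 * is the first page of the cluster.
 */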
1118 bool f2fs_compress_write_end(struct inode *inode, void *fsdata,
1119                                         pgoff_t index, unsigned copied)
1120
1121 {
1122         struct compress_ctx cc = {
1123                 .inode = inode,
1124                 .log_cluster_size = F2FS_I(inode)->i_log_cluster_size,
1125                 .cluster_size = F2FS_I(inode)->i_cluster_size,
1126                 .rpages = fsdata,
1127         };
1128         bool first_index = (index == cc.rpages[0]->index);
1129
1130         if (copied)
1131                 set_cluster_dirty(&cc);
1132
1133         f2fs_put_rpages_wbc(&cc, NULL, false, 1);
1134         f2fs_destroy_compress_ctx(&cc, false);
1135
1136         return first_index;
1137 }
1138
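/*
 * Truncation inside a cluster: for a compressed cluster, read it in, zero
 * out everything in the page cache from @from to the end of the cluster and
 * dirty the pages so the truncated cluster is rewritten; for a normal
 * cluster, fall back to f2fs_do_truncate_blocks().
 */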
1139 int f2fs_truncate_partial_cluster(struct inode *inode, u64 from, bool lock)
1140 {
1141         void *fsdata = NULL;
1142         struct page *pagep;
1143         int log_cluster_size = F2FS_I(inode)->i_log_cluster_size;
1144         pgoff_t start_idx = from >> (PAGE_SHIFT + log_cluster_size) <<
1145                                                         log_cluster_size;
1146         int err;
1147
1148         err = f2fs_is_compressed_cluster(inode, start_idx);
1149         if (err < 0)
1150                 return err;
1151
1152         /* truncate normal cluster */
1153         if (!err)
1154                 return f2fs_do_truncate_blocks(inode, from, lock);
1155
1156         /* truncate compressed cluster */
1157         err = f2fs_prepare_compress_overwrite(inode, &pagep,
1158                                                 start_idx, &fsdata);
1159
1160         /* should not be a normal cluster */
1161         f2fs_bug_on(F2FS_I_SB(inode), err == 0);
1162
1163         if (err <= 0)
1164                 return err;
1165
1166         if (err > 0) {
1167                 struct page **rpages = fsdata;
1168                 int cluster_size = F2FS_I(inode)->i_cluster_size;
1169                 int i;
1170
1171                 for (i = cluster_size - 1; i >= 0; i--) {
1172                         loff_t start = rpages[i]->index << PAGE_SHIFT;
1173
1174                         if (from <= start) {
1175                                 zero_user_segment(rpages[i], 0, PAGE_SIZE);
1176                         } else {
1177                                 zero_user_segment(rpages[i], from - start,
1178                                                                 PAGE_SIZE);
1179                                 break;
1180                         }
1181                 }
1182
1183                 f2fs_compress_write_end(inode, fsdata, start_idx, true);
1184         }
1185         return 0;
1186 }
1187
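/*
 * Write one cluster in compressed form: tag the first block with
 * COMPRESS_ADDR, write the compressed pages out-of-place and update the
 * per-inode compressed block count.  Any failure returns -EAGAIN so that
 * the caller falls back to writing the raw pages.
 */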
1188 static int f2fs_write_compressed_pages(struct compress_ctx *cc,
1189                                         int *submitted,
1190                                         struct writeback_control *wbc,
1191                                         enum iostat_type io_type)
1192 {
1193         struct inode *inode = cc->inode;
1194         struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
1195         struct f2fs_inode_info *fi = F2FS_I(inode);
1196         struct f2fs_io_info fio = {
1197                 .sbi = sbi,
1198                 .ino = cc->inode->i_ino,
1199                 .type = DATA,
1200                 .op = REQ_OP_WRITE,
1201                 .op_flags = wbc_to_write_flags(wbc),
1202                 .old_blkaddr = NEW_ADDR,
1203                 .page = NULL,
1204                 .encrypted_page = NULL,
1205                 .compressed_page = NULL,
1206                 .submitted = false,
1207                 .io_type = io_type,
1208                 .io_wbc = wbc,
1209                 .encrypted = fscrypt_inode_uses_fs_layer_crypto(cc->inode),
1210         };
1211         struct dnode_of_data dn;
1212         struct node_info ni;
1213         struct compress_io_ctx *cic;
1214         pgoff_t start_idx = start_idx_of_cluster(cc);
1215         unsigned int last_index = cc->cluster_size - 1;
1216         loff_t psize;
1217         int i, err;
1218
1219         /* we should bypass data pages to let the kworker jobs proceed */
1220         if (unlikely(f2fs_cp_error(sbi))) {
1221                 mapping_set_error(cc->rpages[0]->mapping, -EIO);
1222                 goto out_free;
1223         }
1224
1225         if (IS_NOQUOTA(inode)) {
1226                 /*
1227                  * We need to wait for node_write to avoid block allocation during
1228                  * checkpoint. This can only happen to quota writes which can cause
1229                  * the below discard race condition.
1230                  */
1231                 down_read(&sbi->node_write);
1232         } else if (!f2fs_trylock_op(sbi)) {
1233                 goto out_free;
1234         }
1235
1236         set_new_dnode(&dn, cc->inode, NULL, NULL, 0);
1237
1238         err = f2fs_get_dnode_of_data(&dn, start_idx, LOOKUP_NODE);
1239         if (err)
1240                 goto out_unlock_op;
1241
1242         for (i = 0; i < cc->cluster_size; i++) {
1243                 if (data_blkaddr(dn.inode, dn.node_page,
1244                                         dn.ofs_in_node + i) == NULL_ADDR)
1245                         goto out_put_dnode;
1246         }
1247
1248         psize = (loff_t)(cc->rpages[last_index]->index + 1) << PAGE_SHIFT;
1249
1250         err = f2fs_get_node_info(fio.sbi, dn.nid, &ni);
1251         if (err)
1252                 goto out_put_dnode;
1253
1254         fio.version = ni.version;
1255
1256         cic = kmem_cache_zalloc(cic_entry_slab, GFP_NOFS);
1257         if (!cic)
1258                 goto out_put_dnode;
1259
1260         cic->magic = F2FS_COMPRESSED_PAGE_MAGIC;
1261         cic->inode = inode;
1262         atomic_set(&cic->pending_pages, cc->nr_cpages);
1263         cic->rpages = page_array_alloc(cc->inode, cc->cluster_size);
1264         if (!cic->rpages)
1265                 goto out_put_cic;
1266
1267         cic->nr_rpages = cc->cluster_size;
1268
1269         for (i = 0; i < cc->nr_cpages; i++) {
1270                 f2fs_set_compressed_page(cc->cpages[i], inode,
1271                                         cc->rpages[i + 1]->index, cic);
1272                 fio.compressed_page = cc->cpages[i];
1273
1274                 fio.old_blkaddr = data_blkaddr(dn.inode, dn.node_page,
1275                                                 dn.ofs_in_node + i + 1);
1276
1277                 /* wait for GCed page writeback via META_MAPPING */
1278                 f2fs_wait_on_block_writeback(inode, fio.old_blkaddr);
1279
1280                 if (fio.encrypted) {
1281                         fio.page = cc->rpages[i + 1];
1282                         err = f2fs_encrypt_one_page(&fio);
1283                         if (err)
1284                                 goto out_destroy_crypt;
1285                         cc->cpages[i] = fio.encrypted_page;
1286                 }
1287         }
1288
1289         set_cluster_writeback(cc);
1290
1291         for (i = 0; i < cc->cluster_size; i++)
1292                 cic->rpages[i] = cc->rpages[i];
1293
1294         for (i = 0; i < cc->cluster_size; i++, dn.ofs_in_node++) {
1295                 block_t blkaddr;
1296
1297                 blkaddr = f2fs_data_blkaddr(&dn);
1298                 fio.page = cc->rpages[i];
1299                 fio.old_blkaddr = blkaddr;
1300
1301                 /* cluster header */
1302                 if (i == 0) {
1303                         if (blkaddr == COMPRESS_ADDR)
1304                                 fio.compr_blocks++;
1305                         if (__is_valid_data_blkaddr(blkaddr))
1306                                 f2fs_invalidate_blocks(sbi, blkaddr);
1307                         f2fs_update_data_blkaddr(&dn, COMPRESS_ADDR);
1308                         goto unlock_continue;
1309                 }
1310
1311                 if (fio.compr_blocks && __is_valid_data_blkaddr(blkaddr))
1312                         fio.compr_blocks++;
1313
1314                 if (i > cc->nr_cpages) {
1315                         if (__is_valid_data_blkaddr(blkaddr)) {
1316                                 f2fs_invalidate_blocks(sbi, blkaddr);
1317                                 f2fs_update_data_blkaddr(&dn, NEW_ADDR);
1318                         }
1319                         goto unlock_continue;
1320                 }
1321
1322                 f2fs_bug_on(fio.sbi, blkaddr == NULL_ADDR);
1323
1324                 if (fio.encrypted)
1325                         fio.encrypted_page = cc->cpages[i - 1];
1326                 else
1327                         fio.compressed_page = cc->cpages[i - 1];
1328
1329                 cc->cpages[i - 1] = NULL;
1330                 f2fs_outplace_write_data(&dn, &fio);
1331                 (*submitted)++;
1332 unlock_continue:
1333                 inode_dec_dirty_pages(cc->inode);
1334                 unlock_page(fio.page);
1335         }
1336
1337         if (fio.compr_blocks)
1338                 f2fs_i_compr_blocks_update(inode, fio.compr_blocks - 1, false);
1339         f2fs_i_compr_blocks_update(inode, cc->nr_cpages, true);
1340         add_compr_block_stat(inode, cc->nr_cpages);
1341
1342         set_inode_flag(cc->inode, FI_APPEND_WRITE);
1343         if (cc->cluster_idx == 0)
1344                 set_inode_flag(inode, FI_FIRST_BLOCK_WRITTEN);
1345
1346         f2fs_put_dnode(&dn);
1347         if (IS_NOQUOTA(inode))
1348                 up_read(&sbi->node_write);
1349         else
1350                 f2fs_unlock_op(sbi);
1351
1352         spin_lock(&fi->i_size_lock);
1353         if (fi->last_disk_size < psize)
1354                 fi->last_disk_size = psize;
1355         spin_unlock(&fi->i_size_lock);
1356
1357         f2fs_put_rpages(cc);
1358         page_array_free(cc->inode, cc->cpages, cc->nr_cpages);
1359         cc->cpages = NULL;
1360         f2fs_destroy_compress_ctx(cc, false);
1361         return 0;
1362
1363 out_destroy_crypt:
1364         page_array_free(cc->inode, cic->rpages, cc->cluster_size);
1365
1366         for (--i; i >= 0; i--)
1367                 fscrypt_finalize_bounce_page(&cc->cpages[i]);
1368         for (i = 0; i < cc->nr_cpages; i++) {
1369                 if (!cc->cpages[i])
1370                         continue;
1371                 f2fs_compress_free_page(cc->cpages[i]);
1372                 cc->cpages[i] = NULL;
1373         }
1374 out_put_cic:
1375         kmem_cache_free(cic_entry_slab, cic);
1376 out_put_dnode:
1377         f2fs_put_dnode(&dn);
1378 out_unlock_op:
1379         if (IS_NOQUOTA(inode))
1380                 up_read(&sbi->node_write);
1381         else
1382                 f2fs_unlock_op(sbi);
1383 out_free:
1384         page_array_free(cc->inode, cc->cpages, cc->nr_cpages);
1385         cc->cpages = NULL;
1386         return -EAGAIN;
1387 }
1388
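/*
 * Write completion for one compressed page: free the intermediate page and,
 * once the last page of the cluster has completed, end writeback on the
 * original raw pages and free the compress_io_ctx.
 */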
1389 void f2fs_compress_write_end_io(struct bio *bio, struct page *page)
1390 {
1391         struct f2fs_sb_info *sbi = bio->bi_private;
1392         struct compress_io_ctx *cic =
1393                         (struct compress_io_ctx *)page_private(page);
1394         int i;
1395
1396         if (unlikely(bio->bi_status))
1397                 mapping_set_error(cic->inode->i_mapping, -EIO);
1398
1399         f2fs_compress_free_page(page);
1400
1401         dec_page_count(sbi, F2FS_WB_DATA);
1402
1403         if (atomic_dec_return(&cic->pending_pages))
1404                 return;
1405
1406         for (i = 0; i < cic->nr_rpages; i++) {
1407                 WARN_ON(!cic->rpages[i]);
1408                 clear_cold_data(cic->rpages[i]);
1409                 end_page_writeback(cic->rpages[i]);
1410         }
1411
1412         page_array_free(cic->inode, cic->rpages, cic->nr_rpages);
1413         kmem_cache_free(cic_entry_slab, cic);
1414 }
1415
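/*
 * Fallback path: write each dirty page of the cluster individually without
 * compression, redirtying any remaining pages on error.
 */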
1416 static int f2fs_write_raw_pages(struct compress_ctx *cc,
1417                                         int *submitted,
1418                                         struct writeback_control *wbc,
1419                                         enum iostat_type io_type)
1420 {
1421         struct address_space *mapping = cc->inode->i_mapping;
1422         int _submitted, compr_blocks, ret;
1423         int i = -1, err = 0;
1424
1425         compr_blocks = f2fs_compressed_blocks(cc);
1426         if (compr_blocks < 0) {
1427                 err = compr_blocks;
1428                 goto out_err;
1429         }
1430
1431         for (i = 0; i < cc->cluster_size; i++) {
1432                 if (!cc->rpages[i])
1433                         continue;
1434 retry_write:
1435                 if (cc->rpages[i]->mapping != mapping) {
1436                         unlock_page(cc->rpages[i]);
1437                         continue;
1438                 }
1439
1440                 BUG_ON(!PageLocked(cc->rpages[i]));
1441
1442                 ret = f2fs_write_single_data_page(cc->rpages[i], &_submitted,
1443                                                 NULL, NULL, wbc, io_type,
1444                                                 compr_blocks, false);
1445                 if (ret) {
1446                         if (ret == AOP_WRITEPAGE_ACTIVATE) {
1447                                 unlock_page(cc->rpages[i]);
1448                                 ret = 0;
1449                         } else if (ret == -EAGAIN) {
1450                                 /*
1451                                  * For quota files, just redirty the remaining
1452                                  * pages to avoid a deadlock caused by a cluster
1453                                  * update race with foreground operations.
1454                                  */
1455                                 if (IS_NOQUOTA(cc->inode)) {
1456                                         err = 0;
1457                                         goto out_err;
1458                                 }
1459                                 ret = 0;
1460                                 cond_resched();
1461                                 congestion_wait(BLK_RW_ASYNC,
1462                                                 DEFAULT_IO_TIMEOUT);
1463                                 lock_page(cc->rpages[i]);
1464
1465                                 if (!PageDirty(cc->rpages[i])) {
1466                                         unlock_page(cc->rpages[i]);
1467                                         continue;
1468                                 }
1469
1470                                 clear_page_dirty_for_io(cc->rpages[i]);
1471                                 goto retry_write;
1472                         }
1473                         err = ret;
1474                         goto out_err;
1475                 }
1476
1477                 *submitted += _submitted;
1478         }
1479
1480         f2fs_balance_fs(F2FS_M_SB(mapping), true);
1481
1482         return 0;
1483 out_err:
1484         for (++i; i < cc->cluster_size; i++) {
1485                 if (!cc->rpages[i])
1486                         continue;
1487                 redirty_page_for_writepage(wbc, cc->rpages[i]);
1488                 unlock_page(cc->rpages[i]);
1489         }
1490         return err;
1491 }
1492
1493 int f2fs_write_multi_pages(struct compress_ctx *cc,
1494                                         int *submitted,
1495                                         struct writeback_control *wbc,
1496                                         enum iostat_type io_type)
1497 {
1498         int err;
1499
1500         *submitted = 0;
1501         if (cluster_may_compress(cc)) {
1502                 err = f2fs_compress_pages(cc);
1503                 if (err == -EAGAIN) {
1504                         goto write;
1505                 } else if (err) {
1506                         f2fs_put_rpages_wbc(cc, wbc, true, 1);
1507                         goto destroy_out;
1508                 }
1509
1510                 err = f2fs_write_compressed_pages(cc, submitted,
1511                                                         wbc, io_type);
1512                 if (!err)
1513                         return 0;
1514                 f2fs_bug_on(F2FS_I_SB(cc->inode), err != -EAGAIN);
1515         }
1516 write:
1517         f2fs_bug_on(F2FS_I_SB(cc->inode), *submitted);
1518
1519         err = f2fs_write_raw_pages(cc, submitted, wbc, io_type);
1520         f2fs_put_rpages_wbc(cc, wbc, false, 0);
1521 destroy_out:
1522         f2fs_destroy_compress_ctx(cc, false);
1523         return err;
1524 }
1525
1526 static void f2fs_free_dic(struct decompress_io_ctx *dic);
1527
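/*
 * Allocate a decompress_io_ctx for the cluster described by @cc, including
 * the intermediate pages that will receive the on-disk compressed data.
 * The caller holds the initial reference.
 */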
1528 struct decompress_io_ctx *f2fs_alloc_dic(struct compress_ctx *cc)
1529 {
1530         struct decompress_io_ctx *dic;
1531         pgoff_t start_idx = start_idx_of_cluster(cc);
1532         int i;
1533
1534         dic = kmem_cache_zalloc(dic_entry_slab, GFP_NOFS);
1535         if (!dic)
1536                 return ERR_PTR(-ENOMEM);
1537
1538         dic->rpages = page_array_alloc(cc->inode, cc->cluster_size);
1539         if (!dic->rpages) {
1540                 kmem_cache_free(dic_entry_slab, dic);
1541                 return ERR_PTR(-ENOMEM);
1542         }
1543
1544         dic->magic = F2FS_COMPRESSED_PAGE_MAGIC;
1545         dic->inode = cc->inode;
1546         atomic_set(&dic->remaining_pages, cc->nr_cpages);
1547         dic->cluster_idx = cc->cluster_idx;
1548         dic->cluster_size = cc->cluster_size;
1549         dic->log_cluster_size = cc->log_cluster_size;
1550         dic->nr_cpages = cc->nr_cpages;
1551         refcount_set(&dic->refcnt, 1);
1552         dic->failed = false;
1553         dic->need_verity = f2fs_need_verity(cc->inode, start_idx);
1554
1555         for (i = 0; i < dic->cluster_size; i++)
1556                 dic->rpages[i] = cc->rpages[i];
1557         dic->nr_rpages = cc->cluster_size;
1558
1559         dic->cpages = page_array_alloc(dic->inode, dic->nr_cpages);
1560         if (!dic->cpages)
1561                 goto out_free;
1562
1563         for (i = 0; i < dic->nr_cpages; i++) {
1564                 struct page *page;
1565
1566                 page = f2fs_compress_alloc_page();
1567                 if (!page)
1568                         goto out_free;
1569
1570                 f2fs_set_compressed_page(page, cc->inode,
1571                                         start_idx + i + 1, dic);
1572                 dic->cpages[i] = page;
1573         }
1574
1575         return dic;
1576
1577 out_free:
1578         f2fs_free_dic(dic);
1579         return ERR_PTR(-ENOMEM);
1580 }
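
/*
 * A minimal caller sketch (an illustration; the real caller lives in the
 * read path in data.c and the variable names here are assumptions).  Note
 * the ERR_PTR() convention: the result is checked with IS_ERR(), never
 * against NULL.
 *
 *	dic = f2fs_alloc_dic(cc);
 *	if (IS_ERR(dic))
 *		return PTR_ERR(dic);
 */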
1581
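/*
 * Free everything the dic owns: temporary pages that do not alias a raw
 * page, the compressed-data pages, the page pointer arrays, and finally
 * the dic itself.  Reached from f2fs_put_dic() when the last reference is
 * dropped, or from the allocation error path above.
 */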
1582 static void f2fs_free_dic(struct decompress_io_ctx *dic)
1583 {
1584         int i;
1585
1586         if (dic->tpages) {
1587                 for (i = 0; i < dic->cluster_size; i++) {
1588                         if (dic->rpages[i])
1589                                 continue;
1590                         if (!dic->tpages[i])
1591                                 continue;
1592                         f2fs_compress_free_page(dic->tpages[i]);
1593                 }
1594                 page_array_free(dic->inode, dic->tpages, dic->cluster_size);
1595         }
1596
1597         if (dic->cpages) {
1598                 for (i = 0; i < dic->nr_cpages; i++) {
1599                         if (!dic->cpages[i])
1600                                 continue;
1601                         f2fs_compress_free_page(dic->cpages[i]);
1602                 }
1603                 page_array_free(dic->inode, dic->cpages, dic->nr_cpages);
1604         }
1605
1606         page_array_free(dic->inode, dic->rpages, dic->nr_rpages);
1607         kmem_cache_free(dic_entry_slab, dic);
1608 }
1609
1610 static void f2fs_put_dic(struct decompress_io_ctx *dic)
1611 {
1612         if (refcount_dec_and_test(&dic->refcnt))
1613                 f2fs_free_dic(dic);
1614 }
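
/*
 * Lifetime sketch (hedged; the actual reference holders live in the read
 * and decompress paths in data.c and are not visible in this file):
 * f2fs_alloc_dic() returns the dic with refcnt == 1, any additional user
 * takes its own reference, and the dic is freed when the last one is put.
 *
 *	refcount_inc(&dic->refcnt);	take an extra reference
 *	use_dic(dic);			(hypothetical user)
 *	f2fs_put_dic(dic);		drop it; frees the dic at zero
 */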
1615
1616 /*
1617  * Update and unlock the cluster's pagecache pages, and release the reference to
1618  * the decompress_io_ctx that was being held for I/O completion.
1619  */
1620 static void __f2fs_decompress_end_io(struct decompress_io_ctx *dic, bool failed)
1621 {
1622         int i;
1623
1624         for (i = 0; i < dic->cluster_size; i++) {
1625                 struct page *rpage = dic->rpages[i];
1626
1627                 if (!rpage)
1628                         continue;
1629
1630                 /* PG_error was set if verity failed. */
1631                 if (failed || PageError(rpage)) {
1632                         ClearPageUptodate(rpage);
1633                         /* will re-read again later */
1634                         ClearPageError(rpage);
1635                 } else {
1636                         SetPageUptodate(rpage);
1637                 }
1638                 unlock_page(rpage);
1639         }
1640
1641         f2fs_put_dic(dic);
1642 }
1643
1644 static void f2fs_verify_cluster(struct work_struct *work)
1645 {
1646         struct decompress_io_ctx *dic =
1647                 container_of(work, struct decompress_io_ctx, verity_work);
1648         int i;
1649
1650         /* Verify the cluster's decompressed pages with fs-verity. */
1651         for (i = 0; i < dic->cluster_size; i++) {
1652                 struct page *rpage = dic->rpages[i];
1653
1654                 if (rpage && !fsverity_verify_page(rpage))
1655                         SetPageError(rpage);
1656         }
1657
1658         __f2fs_decompress_end_io(dic, false);
1659 }
1660
1661 /*
1662  * This is called when a compressed cluster has been decompressed
1663  * (or failed to be read and/or decompressed).
1664  */
1665 void f2fs_decompress_end_io(struct decompress_io_ctx *dic, bool failed)
1666 {
1667         if (!failed && dic->need_verity) {
1668                 /*
1669                  * Note that to avoid deadlocks, the verity work can't be done
1670                  * on the decompression workqueue.  This is because verifying
1671                  * the data pages can involve reading metadata pages from the
1672                  * file, and these metadata pages may be compressed.
1673                  */
1674                 INIT_WORK(&dic->verity_work, f2fs_verify_cluster);
1675                 fsverity_enqueue_verify_work(&dic->verity_work);
1676         } else {
1677                 __f2fs_decompress_end_io(dic, failed);
1678         }
1679 }
1680
1681 /*
1682  * Put a reference to a compressed page's decompress_io_ctx.
1683  *
1684  * This is called when the page is no longer needed and can be freed.
1685  */
1686 void f2fs_put_page_dic(struct page *page)
1687 {
1688         struct decompress_io_ctx *dic =
1689                         (struct decompress_io_ctx *)page_private(page);
1690
1691         f2fs_put_dic(dic);
1692 }
1693
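/*
 * Per-superblock slab for the page pointer arrays used above.  Sizing
 * example (an illustration, assuming a 64-bit kernel where
 * sizeof(struct page *) == 8): with the default compress_log_size of 2,
 * i.e. 4-page clusters, each slab object is 8 << 2 = 32 bytes.
 */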
1694 int f2fs_init_page_array_cache(struct f2fs_sb_info *sbi)
1695 {
1696         dev_t dev = sbi->sb->s_bdev->bd_dev;
1697         char slab_name[32];
1698
1699         snprintf(slab_name, sizeof(slab_name), "f2fs_page_array_entry-%u:%u", MAJOR(dev), MINOR(dev));
1700
1701         sbi->page_array_slab_size = sizeof(struct page *) <<
1702                                         F2FS_OPTION(sbi).compress_log_size;
1703
1704         sbi->page_array_slab = f2fs_kmem_cache_create(slab_name,
1705                                         sbi->page_array_slab_size);
1706         if (!sbi->page_array_slab)
1707                 return -ENOMEM;
1708         return 0;
1709 }
1710
1711 void f2fs_destroy_page_array_cache(struct f2fs_sb_info *sbi)
1712 {
1713         kmem_cache_destroy(sbi->page_array_slab);
1714 }
1715
1716 static int __init f2fs_init_cic_cache(void)
1717 {
1718         cic_entry_slab = f2fs_kmem_cache_create("f2fs_cic_entry",
1719                                         sizeof(struct compress_io_ctx));
1720         if (!cic_entry_slab)
1721                 return -ENOMEM;
1722         return 0;
1723 }
1724
1725 static void f2fs_destroy_cic_cache(void)
1726 {
1727         kmem_cache_destroy(cic_entry_slab);
1728 }
1729
1730 static int __init f2fs_init_dic_cache(void)
1731 {
1732         dic_entry_slab = f2fs_kmem_cache_create("f2fs_dic_entry",
1733                                         sizeof(struct decompress_io_ctx));
1734         if (!dic_entry_slab)
1735                 return -ENOMEM;
1736         return 0;
1737 }
1738
1739 static void f2fs_destroy_dic_cache(void)
1740 {
1741         kmem_cache_destroy(dic_entry_slab);
1742 }
1743
1744 int __init f2fs_init_compress_cache(void)
1745 {
1746         int err;
1747
1748         err = f2fs_init_cic_cache();
1749         if (err)
1750                 goto out;
1751         err = f2fs_init_dic_cache();
1752         if (err)
1753                 goto free_cic;
1754         return 0;
1755 free_cic:
1756         f2fs_destroy_cic_cache();
1757 out:
1758         return -ENOMEM;
1759 }
1760
1761 void f2fs_destroy_compress_cache(void)
1762 {
1763         f2fs_destroy_dic_cache();
1764         f2fs_destroy_cic_cache();
1765 }
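
/*
 * Illustrative use (a sketch, not the exact code in super.c): the global
 * cic/dic caches are created once during module init and destroyed on the
 * failure unwind path or at module exit; the label below is hypothetical.
 *
 *	err = f2fs_init_compress_cache();
 *	if (err)
 *		goto free_earlier_caches;
 *
 *	f2fs_destroy_compress_cache();
 */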