Merge branch 'turbostat' of git://git.kernel.org/pub/scm/linux/kernel/git/lenb/linux
[linux-2.6-microblaze.git] / fs / f2fs / compress.c
1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  * f2fs compress support
4  *
5  * Copyright (c) 2019 Chao Yu <chao@kernel.org>
6  */
7
8 #include <linux/fs.h>
9 #include <linux/f2fs_fs.h>
10 #include <linux/writeback.h>
11 #include <linux/backing-dev.h>
12 #include <linux/lzo.h>
13 #include <linux/lz4.h>
14 #include <linux/zstd.h>
15
16 #include "f2fs.h"
17 #include "node.h"
18 #include <trace/events/f2fs.h>
19
20 static struct kmem_cache *cic_entry_slab;
21 static struct kmem_cache *dic_entry_slab;
22
23 static void *page_array_alloc(struct inode *inode, int nr)
24 {
25         struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
26         unsigned int size = sizeof(struct page *) * nr;
27
28         if (likely(size <= sbi->page_array_slab_size))
29                 return kmem_cache_zalloc(sbi->page_array_slab, GFP_NOFS);
30         return f2fs_kzalloc(sbi, size, GFP_NOFS);
31 }
32
33 static void page_array_free(struct inode *inode, void *pages, int nr)
34 {
35         struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
36         unsigned int size = sizeof(struct page *) * nr;
37
38         if (!pages)
39                 return;
40
41         if (likely(size <= sbi->page_array_slab_size))
42                 kmem_cache_free(sbi->page_array_slab, pages);
43         else
44                 kfree(pages);
45 }
46
47 struct f2fs_compress_ops {
48         int (*init_compress_ctx)(struct compress_ctx *cc);
49         void (*destroy_compress_ctx)(struct compress_ctx *cc);
50         int (*compress_pages)(struct compress_ctx *cc);
51         int (*init_decompress_ctx)(struct decompress_io_ctx *dic);
52         void (*destroy_decompress_ctx)(struct decompress_io_ctx *dic);
53         int (*decompress_pages)(struct decompress_io_ctx *dic);
54 };
55
56 static unsigned int offset_in_cluster(struct compress_ctx *cc, pgoff_t index)
57 {
58         return index & (cc->cluster_size - 1);
59 }
60
61 static pgoff_t cluster_idx(struct compress_ctx *cc, pgoff_t index)
62 {
63         return index >> cc->log_cluster_size;
64 }
65
66 static pgoff_t start_idx_of_cluster(struct compress_ctx *cc)
67 {
68         return cc->cluster_idx << cc->log_cluster_size;
69 }
70
71 bool f2fs_is_compressed_page(struct page *page)
72 {
73         if (!PagePrivate(page))
74                 return false;
75         if (!page_private(page))
76                 return false;
77         if (IS_ATOMIC_WRITTEN_PAGE(page) || IS_DUMMY_WRITTEN_PAGE(page))
78                 return false;
79
80         f2fs_bug_on(F2FS_M_SB(page->mapping),
81                 *((u32 *)page_private(page)) != F2FS_COMPRESSED_PAGE_MAGIC);
82         return true;
83 }
84
85 static void f2fs_set_compressed_page(struct page *page,
86                 struct inode *inode, pgoff_t index, void *data)
87 {
88         SetPagePrivate(page);
89         set_page_private(page, (unsigned long)data);
90
91         /* i_crypto_info and iv index */
92         page->index = index;
93         page->mapping = inode->i_mapping;
94 }
95
96 static void f2fs_drop_rpages(struct compress_ctx *cc, int len, bool unlock)
97 {
98         int i;
99
100         for (i = 0; i < len; i++) {
101                 if (!cc->rpages[i])
102                         continue;
103                 if (unlock)
104                         unlock_page(cc->rpages[i]);
105                 else
106                         put_page(cc->rpages[i]);
107         }
108 }
109
110 static void f2fs_put_rpages(struct compress_ctx *cc)
111 {
112         f2fs_drop_rpages(cc, cc->cluster_size, false);
113 }
114
115 static void f2fs_unlock_rpages(struct compress_ctx *cc, int len)
116 {
117         f2fs_drop_rpages(cc, len, true);
118 }
119
120 static void f2fs_put_rpages_mapping(struct address_space *mapping,
121                                 pgoff_t start, int len)
122 {
123         int i;
124
125         for (i = 0; i < len; i++) {
126                 struct page *page = find_get_page(mapping, start + i);
127
128                 put_page(page);
129                 put_page(page);
130         }
131 }
132
133 static void f2fs_put_rpages_wbc(struct compress_ctx *cc,
134                 struct writeback_control *wbc, bool redirty, int unlock)
135 {
136         unsigned int i;
137
138         for (i = 0; i < cc->cluster_size; i++) {
139                 if (!cc->rpages[i])
140                         continue;
141                 if (redirty)
142                         redirty_page_for_writepage(wbc, cc->rpages[i]);
143                 f2fs_put_page(cc->rpages[i], unlock);
144         }
145 }
146
147 struct page *f2fs_compress_control_page(struct page *page)
148 {
149         return ((struct compress_io_ctx *)page_private(page))->rpages[0];
150 }
151
152 int f2fs_init_compress_ctx(struct compress_ctx *cc)
153 {
154         if (cc->rpages)
155                 return 0;
156
157         cc->rpages = page_array_alloc(cc->inode, cc->cluster_size);
158         return cc->rpages ? 0 : -ENOMEM;
159 }
160
161 void f2fs_destroy_compress_ctx(struct compress_ctx *cc)
162 {
163         page_array_free(cc->inode, cc->rpages, cc->cluster_size);
164         cc->rpages = NULL;
165         cc->nr_rpages = 0;
166         cc->nr_cpages = 0;
167         cc->cluster_idx = NULL_CLUSTER;
168 }
169
170 void f2fs_compress_ctx_add_page(struct compress_ctx *cc, struct page *page)
171 {
172         unsigned int cluster_ofs;
173
174         if (!f2fs_cluster_can_merge_page(cc, page->index))
175                 f2fs_bug_on(F2FS_I_SB(cc->inode), 1);
176
177         cluster_ofs = offset_in_cluster(cc, page->index);
178         cc->rpages[cluster_ofs] = page;
179         cc->nr_rpages++;
180         cc->cluster_idx = cluster_idx(cc, page->index);
181 }
182
183 #ifdef CONFIG_F2FS_FS_LZO
184 static int lzo_init_compress_ctx(struct compress_ctx *cc)
185 {
186         cc->private = f2fs_kvmalloc(F2FS_I_SB(cc->inode),
187                                 LZO1X_MEM_COMPRESS, GFP_NOFS);
188         if (!cc->private)
189                 return -ENOMEM;
190
191         cc->clen = lzo1x_worst_compress(PAGE_SIZE << cc->log_cluster_size);
192         return 0;
193 }
194
195 static void lzo_destroy_compress_ctx(struct compress_ctx *cc)
196 {
197         kvfree(cc->private);
198         cc->private = NULL;
199 }
200
201 static int lzo_compress_pages(struct compress_ctx *cc)
202 {
203         int ret;
204
205         ret = lzo1x_1_compress(cc->rbuf, cc->rlen, cc->cbuf->cdata,
206                                         &cc->clen, cc->private);
207         if (ret != LZO_E_OK) {
208                 printk_ratelimited("%sF2FS-fs (%s): lzo compress failed, ret:%d\n",
209                                 KERN_ERR, F2FS_I_SB(cc->inode)->sb->s_id, ret);
210                 return -EIO;
211         }
212         return 0;
213 }
214
215 static int lzo_decompress_pages(struct decompress_io_ctx *dic)
216 {
217         int ret;
218
219         ret = lzo1x_decompress_safe(dic->cbuf->cdata, dic->clen,
220                                                 dic->rbuf, &dic->rlen);
221         if (ret != LZO_E_OK) {
222                 printk_ratelimited("%sF2FS-fs (%s): lzo decompress failed, ret:%d\n",
223                                 KERN_ERR, F2FS_I_SB(dic->inode)->sb->s_id, ret);
224                 return -EIO;
225         }
226
227         if (dic->rlen != PAGE_SIZE << dic->log_cluster_size) {
228                 printk_ratelimited("%sF2FS-fs (%s): lzo invalid rlen:%zu, "
229                                         "expected:%lu\n", KERN_ERR,
230                                         F2FS_I_SB(dic->inode)->sb->s_id,
231                                         dic->rlen,
232                                         PAGE_SIZE << dic->log_cluster_size);
233                 return -EIO;
234         }
235         return 0;
236 }
237
238 static const struct f2fs_compress_ops f2fs_lzo_ops = {
239         .init_compress_ctx      = lzo_init_compress_ctx,
240         .destroy_compress_ctx   = lzo_destroy_compress_ctx,
241         .compress_pages         = lzo_compress_pages,
242         .decompress_pages       = lzo_decompress_pages,
243 };
244 #endif
245
246 #ifdef CONFIG_F2FS_FS_LZ4
247 static int lz4_init_compress_ctx(struct compress_ctx *cc)
248 {
249         unsigned int size = LZ4_MEM_COMPRESS;
250
251 #ifdef CONFIG_F2FS_FS_LZ4HC
252         if (F2FS_I(cc->inode)->i_compress_flag >> COMPRESS_LEVEL_OFFSET)
253                 size = LZ4HC_MEM_COMPRESS;
254 #endif
255
256         cc->private = f2fs_kvmalloc(F2FS_I_SB(cc->inode), size, GFP_NOFS);
257         if (!cc->private)
258                 return -ENOMEM;
259
260         /*
261          * we do not change cc->clen to LZ4_compressBound(inputsize) to
262          * adapt worst compress case, because lz4 compressor can handle
263          * output budget properly.
264          */
265         cc->clen = cc->rlen - PAGE_SIZE - COMPRESS_HEADER_SIZE;
266         return 0;
267 }
268
269 static void lz4_destroy_compress_ctx(struct compress_ctx *cc)
270 {
271         kvfree(cc->private);
272         cc->private = NULL;
273 }
274
275 #ifdef CONFIG_F2FS_FS_LZ4HC
276 static int lz4hc_compress_pages(struct compress_ctx *cc)
277 {
278         unsigned char level = F2FS_I(cc->inode)->i_compress_flag >>
279                                                 COMPRESS_LEVEL_OFFSET;
280         int len;
281
282         if (level)
283                 len = LZ4_compress_HC(cc->rbuf, cc->cbuf->cdata, cc->rlen,
284                                         cc->clen, level, cc->private);
285         else
286                 len = LZ4_compress_default(cc->rbuf, cc->cbuf->cdata, cc->rlen,
287                                                 cc->clen, cc->private);
288         if (!len)
289                 return -EAGAIN;
290
291         cc->clen = len;
292         return 0;
293 }
294 #endif
295
296 static int lz4_compress_pages(struct compress_ctx *cc)
297 {
298         int len;
299
300 #ifdef CONFIG_F2FS_FS_LZ4HC
301         return lz4hc_compress_pages(cc);
302 #endif
303         len = LZ4_compress_default(cc->rbuf, cc->cbuf->cdata, cc->rlen,
304                                                 cc->clen, cc->private);
305         if (!len)
306                 return -EAGAIN;
307
308         cc->clen = len;
309         return 0;
310 }
311
312 static int lz4_decompress_pages(struct decompress_io_ctx *dic)
313 {
314         int ret;
315
316         ret = LZ4_decompress_safe(dic->cbuf->cdata, dic->rbuf,
317                                                 dic->clen, dic->rlen);
318         if (ret < 0) {
319                 printk_ratelimited("%sF2FS-fs (%s): lz4 decompress failed, ret:%d\n",
320                                 KERN_ERR, F2FS_I_SB(dic->inode)->sb->s_id, ret);
321                 return -EIO;
322         }
323
324         if (ret != PAGE_SIZE << dic->log_cluster_size) {
325                 printk_ratelimited("%sF2FS-fs (%s): lz4 invalid rlen:%zu, "
326                                         "expected:%lu\n", KERN_ERR,
327                                         F2FS_I_SB(dic->inode)->sb->s_id,
328                                         dic->rlen,
329                                         PAGE_SIZE << dic->log_cluster_size);
330                 return -EIO;
331         }
332         return 0;
333 }
334
335 static const struct f2fs_compress_ops f2fs_lz4_ops = {
336         .init_compress_ctx      = lz4_init_compress_ctx,
337         .destroy_compress_ctx   = lz4_destroy_compress_ctx,
338         .compress_pages         = lz4_compress_pages,
339         .decompress_pages       = lz4_decompress_pages,
340 };
341 #endif
342
343 #ifdef CONFIG_F2FS_FS_ZSTD
344 #define F2FS_ZSTD_DEFAULT_CLEVEL        1
345
346 static int zstd_init_compress_ctx(struct compress_ctx *cc)
347 {
348         ZSTD_parameters params;
349         ZSTD_CStream *stream;
350         void *workspace;
351         unsigned int workspace_size;
352         unsigned char level = F2FS_I(cc->inode)->i_compress_flag >>
353                                                 COMPRESS_LEVEL_OFFSET;
354
355         if (!level)
356                 level = F2FS_ZSTD_DEFAULT_CLEVEL;
357
358         params = ZSTD_getParams(level, cc->rlen, 0);
359         workspace_size = ZSTD_CStreamWorkspaceBound(params.cParams);
360
361         workspace = f2fs_kvmalloc(F2FS_I_SB(cc->inode),
362                                         workspace_size, GFP_NOFS);
363         if (!workspace)
364                 return -ENOMEM;
365
366         stream = ZSTD_initCStream(params, 0, workspace, workspace_size);
367         if (!stream) {
368                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD_initCStream failed\n",
369                                 KERN_ERR, F2FS_I_SB(cc->inode)->sb->s_id,
370                                 __func__);
371                 kvfree(workspace);
372                 return -EIO;
373         }
374
375         cc->private = workspace;
376         cc->private2 = stream;
377
378         cc->clen = cc->rlen - PAGE_SIZE - COMPRESS_HEADER_SIZE;
379         return 0;
380 }
381
382 static void zstd_destroy_compress_ctx(struct compress_ctx *cc)
383 {
384         kvfree(cc->private);
385         cc->private = NULL;
386         cc->private2 = NULL;
387 }
388
389 static int zstd_compress_pages(struct compress_ctx *cc)
390 {
391         ZSTD_CStream *stream = cc->private2;
392         ZSTD_inBuffer inbuf;
393         ZSTD_outBuffer outbuf;
394         int src_size = cc->rlen;
395         int dst_size = src_size - PAGE_SIZE - COMPRESS_HEADER_SIZE;
396         int ret;
397
398         inbuf.pos = 0;
399         inbuf.src = cc->rbuf;
400         inbuf.size = src_size;
401
402         outbuf.pos = 0;
403         outbuf.dst = cc->cbuf->cdata;
404         outbuf.size = dst_size;
405
406         ret = ZSTD_compressStream(stream, &outbuf, &inbuf);
407         if (ZSTD_isError(ret)) {
408                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD_compressStream failed, ret: %d\n",
409                                 KERN_ERR, F2FS_I_SB(cc->inode)->sb->s_id,
410                                 __func__, ZSTD_getErrorCode(ret));
411                 return -EIO;
412         }
413
414         ret = ZSTD_endStream(stream, &outbuf);
415         if (ZSTD_isError(ret)) {
416                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD_endStream returned %d\n",
417                                 KERN_ERR, F2FS_I_SB(cc->inode)->sb->s_id,
418                                 __func__, ZSTD_getErrorCode(ret));
419                 return -EIO;
420         }
421
422         /*
423          * there is compressed data remained in intermediate buffer due to
424          * no more space in cbuf.cdata
425          */
426         if (ret)
427                 return -EAGAIN;
428
429         cc->clen = outbuf.pos;
430         return 0;
431 }
432
433 static int zstd_init_decompress_ctx(struct decompress_io_ctx *dic)
434 {
435         ZSTD_DStream *stream;
436         void *workspace;
437         unsigned int workspace_size;
438         unsigned int max_window_size =
439                         MAX_COMPRESS_WINDOW_SIZE(dic->log_cluster_size);
440
441         workspace_size = ZSTD_DStreamWorkspaceBound(max_window_size);
442
443         workspace = f2fs_kvmalloc(F2FS_I_SB(dic->inode),
444                                         workspace_size, GFP_NOFS);
445         if (!workspace)
446                 return -ENOMEM;
447
448         stream = ZSTD_initDStream(max_window_size, workspace, workspace_size);
449         if (!stream) {
450                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD_initDStream failed\n",
451                                 KERN_ERR, F2FS_I_SB(dic->inode)->sb->s_id,
452                                 __func__);
453                 kvfree(workspace);
454                 return -EIO;
455         }
456
457         dic->private = workspace;
458         dic->private2 = stream;
459
460         return 0;
461 }
462
463 static void zstd_destroy_decompress_ctx(struct decompress_io_ctx *dic)
464 {
465         kvfree(dic->private);
466         dic->private = NULL;
467         dic->private2 = NULL;
468 }
469
470 static int zstd_decompress_pages(struct decompress_io_ctx *dic)
471 {
472         ZSTD_DStream *stream = dic->private2;
473         ZSTD_inBuffer inbuf;
474         ZSTD_outBuffer outbuf;
475         int ret;
476
477         inbuf.pos = 0;
478         inbuf.src = dic->cbuf->cdata;
479         inbuf.size = dic->clen;
480
481         outbuf.pos = 0;
482         outbuf.dst = dic->rbuf;
483         outbuf.size = dic->rlen;
484
485         ret = ZSTD_decompressStream(stream, &outbuf, &inbuf);
486         if (ZSTD_isError(ret)) {
487                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD_compressStream failed, ret: %d\n",
488                                 KERN_ERR, F2FS_I_SB(dic->inode)->sb->s_id,
489                                 __func__, ZSTD_getErrorCode(ret));
490                 return -EIO;
491         }
492
493         if (dic->rlen != outbuf.pos) {
494                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD invalid rlen:%zu, "
495                                 "expected:%lu\n", KERN_ERR,
496                                 F2FS_I_SB(dic->inode)->sb->s_id,
497                                 __func__, dic->rlen,
498                                 PAGE_SIZE << dic->log_cluster_size);
499                 return -EIO;
500         }
501
502         return 0;
503 }
504
505 static const struct f2fs_compress_ops f2fs_zstd_ops = {
506         .init_compress_ctx      = zstd_init_compress_ctx,
507         .destroy_compress_ctx   = zstd_destroy_compress_ctx,
508         .compress_pages         = zstd_compress_pages,
509         .init_decompress_ctx    = zstd_init_decompress_ctx,
510         .destroy_decompress_ctx = zstd_destroy_decompress_ctx,
511         .decompress_pages       = zstd_decompress_pages,
512 };
513 #endif
514
515 #ifdef CONFIG_F2FS_FS_LZO
516 #ifdef CONFIG_F2FS_FS_LZORLE
517 static int lzorle_compress_pages(struct compress_ctx *cc)
518 {
519         int ret;
520
521         ret = lzorle1x_1_compress(cc->rbuf, cc->rlen, cc->cbuf->cdata,
522                                         &cc->clen, cc->private);
523         if (ret != LZO_E_OK) {
524                 printk_ratelimited("%sF2FS-fs (%s): lzo-rle compress failed, ret:%d\n",
525                                 KERN_ERR, F2FS_I_SB(cc->inode)->sb->s_id, ret);
526                 return -EIO;
527         }
528         return 0;
529 }
530
531 static const struct f2fs_compress_ops f2fs_lzorle_ops = {
532         .init_compress_ctx      = lzo_init_compress_ctx,
533         .destroy_compress_ctx   = lzo_destroy_compress_ctx,
534         .compress_pages         = lzorle_compress_pages,
535         .decompress_pages       = lzo_decompress_pages,
536 };
537 #endif
538 #endif
539
540 static const struct f2fs_compress_ops *f2fs_cops[COMPRESS_MAX] = {
541 #ifdef CONFIG_F2FS_FS_LZO
542         &f2fs_lzo_ops,
543 #else
544         NULL,
545 #endif
546 #ifdef CONFIG_F2FS_FS_LZ4
547         &f2fs_lz4_ops,
548 #else
549         NULL,
550 #endif
551 #ifdef CONFIG_F2FS_FS_ZSTD
552         &f2fs_zstd_ops,
553 #else
554         NULL,
555 #endif
556 #if defined(CONFIG_F2FS_FS_LZO) && defined(CONFIG_F2FS_FS_LZORLE)
557         &f2fs_lzorle_ops,
558 #else
559         NULL,
560 #endif
561 };
562
563 bool f2fs_is_compress_backend_ready(struct inode *inode)
564 {
565         if (!f2fs_compressed_file(inode))
566                 return true;
567         return f2fs_cops[F2FS_I(inode)->i_compress_algorithm];
568 }
569
570 static mempool_t *compress_page_pool;
571 static int num_compress_pages = 512;
572 module_param(num_compress_pages, uint, 0444);
573 MODULE_PARM_DESC(num_compress_pages,
574                 "Number of intermediate compress pages to preallocate");
575
576 int f2fs_init_compress_mempool(void)
577 {
578         compress_page_pool = mempool_create_page_pool(num_compress_pages, 0);
579         if (!compress_page_pool)
580                 return -ENOMEM;
581
582         return 0;
583 }
584
585 void f2fs_destroy_compress_mempool(void)
586 {
587         mempool_destroy(compress_page_pool);
588 }
589
590 static struct page *f2fs_compress_alloc_page(void)
591 {
592         struct page *page;
593
594         page = mempool_alloc(compress_page_pool, GFP_NOFS);
595         lock_page(page);
596
597         return page;
598 }
599
600 static void f2fs_compress_free_page(struct page *page)
601 {
602         if (!page)
603                 return;
604         set_page_private(page, (unsigned long)NULL);
605         ClearPagePrivate(page);
606         page->mapping = NULL;
607         unlock_page(page);
608         mempool_free(page, compress_page_pool);
609 }
610
611 #define MAX_VMAP_RETRIES        3
612
613 static void *f2fs_vmap(struct page **pages, unsigned int count)
614 {
615         int i;
616         void *buf = NULL;
617
618         for (i = 0; i < MAX_VMAP_RETRIES; i++) {
619                 buf = vm_map_ram(pages, count, -1);
620                 if (buf)
621                         break;
622                 vm_unmap_aliases();
623         }
624         return buf;
625 }
626
627 static int f2fs_compress_pages(struct compress_ctx *cc)
628 {
629         struct f2fs_inode_info *fi = F2FS_I(cc->inode);
630         const struct f2fs_compress_ops *cops =
631                                 f2fs_cops[fi->i_compress_algorithm];
632         unsigned int max_len, new_nr_cpages;
633         struct page **new_cpages;
634         u32 chksum = 0;
635         int i, ret;
636
637         trace_f2fs_compress_pages_start(cc->inode, cc->cluster_idx,
638                                 cc->cluster_size, fi->i_compress_algorithm);
639
640         if (cops->init_compress_ctx) {
641                 ret = cops->init_compress_ctx(cc);
642                 if (ret)
643                         goto out;
644         }
645
646         max_len = COMPRESS_HEADER_SIZE + cc->clen;
647         cc->nr_cpages = DIV_ROUND_UP(max_len, PAGE_SIZE);
648
649         cc->cpages = page_array_alloc(cc->inode, cc->nr_cpages);
650         if (!cc->cpages) {
651                 ret = -ENOMEM;
652                 goto destroy_compress_ctx;
653         }
654
655         for (i = 0; i < cc->nr_cpages; i++) {
656                 cc->cpages[i] = f2fs_compress_alloc_page();
657                 if (!cc->cpages[i]) {
658                         ret = -ENOMEM;
659                         goto out_free_cpages;
660                 }
661         }
662
663         cc->rbuf = f2fs_vmap(cc->rpages, cc->cluster_size);
664         if (!cc->rbuf) {
665                 ret = -ENOMEM;
666                 goto out_free_cpages;
667         }
668
669         cc->cbuf = f2fs_vmap(cc->cpages, cc->nr_cpages);
670         if (!cc->cbuf) {
671                 ret = -ENOMEM;
672                 goto out_vunmap_rbuf;
673         }
674
675         ret = cops->compress_pages(cc);
676         if (ret)
677                 goto out_vunmap_cbuf;
678
679         max_len = PAGE_SIZE * (cc->cluster_size - 1) - COMPRESS_HEADER_SIZE;
680
681         if (cc->clen > max_len) {
682                 ret = -EAGAIN;
683                 goto out_vunmap_cbuf;
684         }
685
686         cc->cbuf->clen = cpu_to_le32(cc->clen);
687
688         if (fi->i_compress_flag & 1 << COMPRESS_CHKSUM)
689                 chksum = f2fs_crc32(F2FS_I_SB(cc->inode),
690                                         cc->cbuf->cdata, cc->clen);
691         cc->cbuf->chksum = cpu_to_le32(chksum);
692
693         for (i = 0; i < COMPRESS_DATA_RESERVED_SIZE; i++)
694                 cc->cbuf->reserved[i] = cpu_to_le32(0);
695
696         new_nr_cpages = DIV_ROUND_UP(cc->clen + COMPRESS_HEADER_SIZE, PAGE_SIZE);
697
698         /* Now we're going to cut unnecessary tail pages */
699         new_cpages = page_array_alloc(cc->inode, new_nr_cpages);
700         if (!new_cpages) {
701                 ret = -ENOMEM;
702                 goto out_vunmap_cbuf;
703         }
704
705         /* zero out any unused part of the last page */
706         memset(&cc->cbuf->cdata[cc->clen], 0,
707                         (new_nr_cpages * PAGE_SIZE) -
708                         (cc->clen + COMPRESS_HEADER_SIZE));
709
710         vm_unmap_ram(cc->cbuf, cc->nr_cpages);
711         vm_unmap_ram(cc->rbuf, cc->cluster_size);
712
713         for (i = 0; i < cc->nr_cpages; i++) {
714                 if (i < new_nr_cpages) {
715                         new_cpages[i] = cc->cpages[i];
716                         continue;
717                 }
718                 f2fs_compress_free_page(cc->cpages[i]);
719                 cc->cpages[i] = NULL;
720         }
721
722         if (cops->destroy_compress_ctx)
723                 cops->destroy_compress_ctx(cc);
724
725         page_array_free(cc->inode, cc->cpages, cc->nr_cpages);
726         cc->cpages = new_cpages;
727         cc->nr_cpages = new_nr_cpages;
728
729         trace_f2fs_compress_pages_end(cc->inode, cc->cluster_idx,
730                                                         cc->clen, ret);
731         return 0;
732
733 out_vunmap_cbuf:
734         vm_unmap_ram(cc->cbuf, cc->nr_cpages);
735 out_vunmap_rbuf:
736         vm_unmap_ram(cc->rbuf, cc->cluster_size);
737 out_free_cpages:
738         for (i = 0; i < cc->nr_cpages; i++) {
739                 if (cc->cpages[i])
740                         f2fs_compress_free_page(cc->cpages[i]);
741         }
742         page_array_free(cc->inode, cc->cpages, cc->nr_cpages);
743         cc->cpages = NULL;
744 destroy_compress_ctx:
745         if (cops->destroy_compress_ctx)
746                 cops->destroy_compress_ctx(cc);
747 out:
748         trace_f2fs_compress_pages_end(cc->inode, cc->cluster_idx,
749                                                         cc->clen, ret);
750         return ret;
751 }
752
753 static void f2fs_decompress_cluster(struct decompress_io_ctx *dic)
754 {
755         struct f2fs_sb_info *sbi = F2FS_I_SB(dic->inode);
756         struct f2fs_inode_info *fi = F2FS_I(dic->inode);
757         const struct f2fs_compress_ops *cops =
758                         f2fs_cops[fi->i_compress_algorithm];
759         int ret;
760         int i;
761
762         trace_f2fs_decompress_pages_start(dic->inode, dic->cluster_idx,
763                                 dic->cluster_size, fi->i_compress_algorithm);
764
765         if (dic->failed) {
766                 ret = -EIO;
767                 goto out_end_io;
768         }
769
770         dic->tpages = page_array_alloc(dic->inode, dic->cluster_size);
771         if (!dic->tpages) {
772                 ret = -ENOMEM;
773                 goto out_end_io;
774         }
775
776         for (i = 0; i < dic->cluster_size; i++) {
777                 if (dic->rpages[i]) {
778                         dic->tpages[i] = dic->rpages[i];
779                         continue;
780                 }
781
782                 dic->tpages[i] = f2fs_compress_alloc_page();
783                 if (!dic->tpages[i]) {
784                         ret = -ENOMEM;
785                         goto out_end_io;
786                 }
787         }
788
789         if (cops->init_decompress_ctx) {
790                 ret = cops->init_decompress_ctx(dic);
791                 if (ret)
792                         goto out_end_io;
793         }
794
795         dic->rbuf = f2fs_vmap(dic->tpages, dic->cluster_size);
796         if (!dic->rbuf) {
797                 ret = -ENOMEM;
798                 goto out_destroy_decompress_ctx;
799         }
800
801         dic->cbuf = f2fs_vmap(dic->cpages, dic->nr_cpages);
802         if (!dic->cbuf) {
803                 ret = -ENOMEM;
804                 goto out_vunmap_rbuf;
805         }
806
807         dic->clen = le32_to_cpu(dic->cbuf->clen);
808         dic->rlen = PAGE_SIZE << dic->log_cluster_size;
809
810         if (dic->clen > PAGE_SIZE * dic->nr_cpages - COMPRESS_HEADER_SIZE) {
811                 ret = -EFSCORRUPTED;
812                 goto out_vunmap_cbuf;
813         }
814
815         ret = cops->decompress_pages(dic);
816
817         if (!ret && (fi->i_compress_flag & 1 << COMPRESS_CHKSUM)) {
818                 u32 provided = le32_to_cpu(dic->cbuf->chksum);
819                 u32 calculated = f2fs_crc32(sbi, dic->cbuf->cdata, dic->clen);
820
821                 if (provided != calculated) {
822                         if (!is_inode_flag_set(dic->inode, FI_COMPRESS_CORRUPT)) {
823                                 set_inode_flag(dic->inode, FI_COMPRESS_CORRUPT);
824                                 printk_ratelimited(
825                                         "%sF2FS-fs (%s): checksum invalid, nid = %lu, %x vs %x",
826                                         KERN_INFO, sbi->sb->s_id, dic->inode->i_ino,
827                                         provided, calculated);
828                         }
829                         set_sbi_flag(sbi, SBI_NEED_FSCK);
830                 }
831         }
832
833 out_vunmap_cbuf:
834         vm_unmap_ram(dic->cbuf, dic->nr_cpages);
835 out_vunmap_rbuf:
836         vm_unmap_ram(dic->rbuf, dic->cluster_size);
837 out_destroy_decompress_ctx:
838         if (cops->destroy_decompress_ctx)
839                 cops->destroy_decompress_ctx(dic);
840 out_end_io:
841         trace_f2fs_decompress_pages_end(dic->inode, dic->cluster_idx,
842                                                         dic->clen, ret);
843         f2fs_decompress_end_io(dic, ret);
844 }
845
846 /*
847  * This is called when a page of a compressed cluster has been read from disk
848  * (or failed to be read from disk).  It checks whether this page was the last
849  * page being waited on in the cluster, and if so, it decompresses the cluster
850  * (or in the case of a failure, cleans up without actually decompressing).
851  */
852 void f2fs_end_read_compressed_page(struct page *page, bool failed)
853 {
854         struct decompress_io_ctx *dic =
855                         (struct decompress_io_ctx *)page_private(page);
856         struct f2fs_sb_info *sbi = F2FS_I_SB(dic->inode);
857
858         dec_page_count(sbi, F2FS_RD_DATA);
859
860         if (failed)
861                 WRITE_ONCE(dic->failed, true);
862
863         if (atomic_dec_and_test(&dic->remaining_pages))
864                 f2fs_decompress_cluster(dic);
865 }
866
867 static bool is_page_in_cluster(struct compress_ctx *cc, pgoff_t index)
868 {
869         if (cc->cluster_idx == NULL_CLUSTER)
870                 return true;
871         return cc->cluster_idx == cluster_idx(cc, index);
872 }
873
874 bool f2fs_cluster_is_empty(struct compress_ctx *cc)
875 {
876         return cc->nr_rpages == 0;
877 }
878
879 static bool f2fs_cluster_is_full(struct compress_ctx *cc)
880 {
881         return cc->cluster_size == cc->nr_rpages;
882 }
883
884 bool f2fs_cluster_can_merge_page(struct compress_ctx *cc, pgoff_t index)
885 {
886         if (f2fs_cluster_is_empty(cc))
887                 return true;
888         return is_page_in_cluster(cc, index);
889 }
890
891 static bool __cluster_may_compress(struct compress_ctx *cc)
892 {
893         loff_t i_size = i_size_read(cc->inode);
894         unsigned nr_pages = DIV_ROUND_UP(i_size, PAGE_SIZE);
895         int i;
896
897         for (i = 0; i < cc->cluster_size; i++) {
898                 struct page *page = cc->rpages[i];
899
900                 f2fs_bug_on(F2FS_I_SB(cc->inode), !page);
901
902                 /* beyond EOF */
903                 if (page->index >= nr_pages)
904                         return false;
905         }
906         return true;
907 }
908
909 static int __f2fs_cluster_blocks(struct compress_ctx *cc, bool compr)
910 {
911         struct dnode_of_data dn;
912         int ret;
913
914         set_new_dnode(&dn, cc->inode, NULL, NULL, 0);
915         ret = f2fs_get_dnode_of_data(&dn, start_idx_of_cluster(cc),
916                                                         LOOKUP_NODE);
917         if (ret) {
918                 if (ret == -ENOENT)
919                         ret = 0;
920                 goto fail;
921         }
922
923         if (dn.data_blkaddr == COMPRESS_ADDR) {
924                 int i;
925
926                 ret = 1;
927                 for (i = 1; i < cc->cluster_size; i++) {
928                         block_t blkaddr;
929
930                         blkaddr = data_blkaddr(dn.inode,
931                                         dn.node_page, dn.ofs_in_node + i);
932                         if (compr) {
933                                 if (__is_valid_data_blkaddr(blkaddr))
934                                         ret++;
935                         } else {
936                                 if (blkaddr != NULL_ADDR)
937                                         ret++;
938                         }
939                 }
940         }
941 fail:
942         f2fs_put_dnode(&dn);
943         return ret;
944 }
945
946 /* return # of compressed blocks in compressed cluster */
947 static int f2fs_compressed_blocks(struct compress_ctx *cc)
948 {
949         return __f2fs_cluster_blocks(cc, true);
950 }
951
952 /* return # of valid blocks in compressed cluster */
953 static int f2fs_cluster_blocks(struct compress_ctx *cc)
954 {
955         return __f2fs_cluster_blocks(cc, false);
956 }
957
958 int f2fs_is_compressed_cluster(struct inode *inode, pgoff_t index)
959 {
960         struct compress_ctx cc = {
961                 .inode = inode,
962                 .log_cluster_size = F2FS_I(inode)->i_log_cluster_size,
963                 .cluster_size = F2FS_I(inode)->i_cluster_size,
964                 .cluster_idx = index >> F2FS_I(inode)->i_log_cluster_size,
965         };
966
967         return f2fs_cluster_blocks(&cc);
968 }
969
970 static bool cluster_may_compress(struct compress_ctx *cc)
971 {
972         if (!f2fs_need_compress_data(cc->inode))
973                 return false;
974         if (f2fs_is_atomic_file(cc->inode))
975                 return false;
976         if (f2fs_is_mmap_file(cc->inode))
977                 return false;
978         if (!f2fs_cluster_is_full(cc))
979                 return false;
980         if (unlikely(f2fs_cp_error(F2FS_I_SB(cc->inode))))
981                 return false;
982         return __cluster_may_compress(cc);
983 }
984
985 static void set_cluster_writeback(struct compress_ctx *cc)
986 {
987         int i;
988
989         for (i = 0; i < cc->cluster_size; i++) {
990                 if (cc->rpages[i])
991                         set_page_writeback(cc->rpages[i]);
992         }
993 }
994
995 static void set_cluster_dirty(struct compress_ctx *cc)
996 {
997         int i;
998
999         for (i = 0; i < cc->cluster_size; i++)
1000                 if (cc->rpages[i])
1001                         set_page_dirty(cc->rpages[i]);
1002 }
1003
1004 static int prepare_compress_overwrite(struct compress_ctx *cc,
1005                 struct page **pagep, pgoff_t index, void **fsdata)
1006 {
1007         struct f2fs_sb_info *sbi = F2FS_I_SB(cc->inode);
1008         struct address_space *mapping = cc->inode->i_mapping;
1009         struct page *page;
1010         struct dnode_of_data dn;
1011         sector_t last_block_in_bio;
1012         unsigned fgp_flag = FGP_LOCK | FGP_WRITE | FGP_CREAT;
1013         pgoff_t start_idx = start_idx_of_cluster(cc);
1014         int i, ret;
1015         bool prealloc;
1016
1017 retry:
1018         ret = f2fs_cluster_blocks(cc);
1019         if (ret <= 0)
1020                 return ret;
1021
1022         /* compressed case */
1023         prealloc = (ret < cc->cluster_size);
1024
1025         ret = f2fs_init_compress_ctx(cc);
1026         if (ret)
1027                 return ret;
1028
1029         /* keep page reference to avoid page reclaim */
1030         for (i = 0; i < cc->cluster_size; i++) {
1031                 page = f2fs_pagecache_get_page(mapping, start_idx + i,
1032                                                         fgp_flag, GFP_NOFS);
1033                 if (!page) {
1034                         ret = -ENOMEM;
1035                         goto unlock_pages;
1036                 }
1037
1038                 if (PageUptodate(page))
1039                         unlock_page(page);
1040                 else
1041                         f2fs_compress_ctx_add_page(cc, page);
1042         }
1043
1044         if (!f2fs_cluster_is_empty(cc)) {
1045                 struct bio *bio = NULL;
1046
1047                 ret = f2fs_read_multi_pages(cc, &bio, cc->cluster_size,
1048                                         &last_block_in_bio, false, true);
1049                 f2fs_destroy_compress_ctx(cc);
1050                 if (ret)
1051                         goto release_pages;
1052                 if (bio)
1053                         f2fs_submit_bio(sbi, bio, DATA);
1054
1055                 ret = f2fs_init_compress_ctx(cc);
1056                 if (ret)
1057                         goto release_pages;
1058         }
1059
1060         for (i = 0; i < cc->cluster_size; i++) {
1061                 f2fs_bug_on(sbi, cc->rpages[i]);
1062
1063                 page = find_lock_page(mapping, start_idx + i);
1064                 f2fs_bug_on(sbi, !page);
1065
1066                 f2fs_wait_on_page_writeback(page, DATA, true, true);
1067
1068                 f2fs_compress_ctx_add_page(cc, page);
1069                 f2fs_put_page(page, 0);
1070
1071                 if (!PageUptodate(page)) {
1072                         f2fs_unlock_rpages(cc, i + 1);
1073                         f2fs_put_rpages_mapping(mapping, start_idx,
1074                                         cc->cluster_size);
1075                         f2fs_destroy_compress_ctx(cc);
1076                         goto retry;
1077                 }
1078         }
1079
1080         if (prealloc) {
1081                 f2fs_do_map_lock(sbi, F2FS_GET_BLOCK_PRE_AIO, true);
1082
1083                 set_new_dnode(&dn, cc->inode, NULL, NULL, 0);
1084
1085                 for (i = cc->cluster_size - 1; i > 0; i--) {
1086                         ret = f2fs_get_block(&dn, start_idx + i);
1087                         if (ret) {
1088                                 i = cc->cluster_size;
1089                                 break;
1090                         }
1091
1092                         if (dn.data_blkaddr != NEW_ADDR)
1093                                 break;
1094                 }
1095
1096                 f2fs_do_map_lock(sbi, F2FS_GET_BLOCK_PRE_AIO, false);
1097         }
1098
1099         if (likely(!ret)) {
1100                 *fsdata = cc->rpages;
1101                 *pagep = cc->rpages[offset_in_cluster(cc, index)];
1102                 return cc->cluster_size;
1103         }
1104
1105 unlock_pages:
1106         f2fs_unlock_rpages(cc, i);
1107 release_pages:
1108         f2fs_put_rpages_mapping(mapping, start_idx, i);
1109         f2fs_destroy_compress_ctx(cc);
1110         return ret;
1111 }
1112
1113 int f2fs_prepare_compress_overwrite(struct inode *inode,
1114                 struct page **pagep, pgoff_t index, void **fsdata)
1115 {
1116         struct compress_ctx cc = {
1117                 .inode = inode,
1118                 .log_cluster_size = F2FS_I(inode)->i_log_cluster_size,
1119                 .cluster_size = F2FS_I(inode)->i_cluster_size,
1120                 .cluster_idx = index >> F2FS_I(inode)->i_log_cluster_size,
1121                 .rpages = NULL,
1122                 .nr_rpages = 0,
1123         };
1124
1125         return prepare_compress_overwrite(&cc, pagep, index, fsdata);
1126 }
1127
1128 bool f2fs_compress_write_end(struct inode *inode, void *fsdata,
1129                                         pgoff_t index, unsigned copied)
1130
1131 {
1132         struct compress_ctx cc = {
1133                 .inode = inode,
1134                 .log_cluster_size = F2FS_I(inode)->i_log_cluster_size,
1135                 .cluster_size = F2FS_I(inode)->i_cluster_size,
1136                 .rpages = fsdata,
1137         };
1138         bool first_index = (index == cc.rpages[0]->index);
1139
1140         if (copied)
1141                 set_cluster_dirty(&cc);
1142
1143         f2fs_put_rpages_wbc(&cc, NULL, false, 1);
1144         f2fs_destroy_compress_ctx(&cc);
1145
1146         return first_index;
1147 }
1148
1149 int f2fs_truncate_partial_cluster(struct inode *inode, u64 from, bool lock)
1150 {
1151         void *fsdata = NULL;
1152         struct page *pagep;
1153         int log_cluster_size = F2FS_I(inode)->i_log_cluster_size;
1154         pgoff_t start_idx = from >> (PAGE_SHIFT + log_cluster_size) <<
1155                                                         log_cluster_size;
1156         int err;
1157
1158         err = f2fs_is_compressed_cluster(inode, start_idx);
1159         if (err < 0)
1160                 return err;
1161
1162         /* truncate normal cluster */
1163         if (!err)
1164                 return f2fs_do_truncate_blocks(inode, from, lock);
1165
1166         /* truncate compressed cluster */
1167         err = f2fs_prepare_compress_overwrite(inode, &pagep,
1168                                                 start_idx, &fsdata);
1169
1170         /* should not be a normal cluster */
1171         f2fs_bug_on(F2FS_I_SB(inode), err == 0);
1172
1173         if (err <= 0)
1174                 return err;
1175
1176         if (err > 0) {
1177                 struct page **rpages = fsdata;
1178                 int cluster_size = F2FS_I(inode)->i_cluster_size;
1179                 int i;
1180
1181                 for (i = cluster_size - 1; i >= 0; i--) {
1182                         loff_t start = rpages[i]->index << PAGE_SHIFT;
1183
1184                         if (from <= start) {
1185                                 zero_user_segment(rpages[i], 0, PAGE_SIZE);
1186                         } else {
1187                                 zero_user_segment(rpages[i], from - start,
1188                                                                 PAGE_SIZE);
1189                                 break;
1190                         }
1191                 }
1192
1193                 f2fs_compress_write_end(inode, fsdata, start_idx, true);
1194         }
1195         return 0;
1196 }
1197
1198 static int f2fs_write_compressed_pages(struct compress_ctx *cc,
1199                                         int *submitted,
1200                                         struct writeback_control *wbc,
1201                                         enum iostat_type io_type)
1202 {
1203         struct inode *inode = cc->inode;
1204         struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
1205         struct f2fs_inode_info *fi = F2FS_I(inode);
1206         struct f2fs_io_info fio = {
1207                 .sbi = sbi,
1208                 .ino = cc->inode->i_ino,
1209                 .type = DATA,
1210                 .op = REQ_OP_WRITE,
1211                 .op_flags = wbc_to_write_flags(wbc),
1212                 .old_blkaddr = NEW_ADDR,
1213                 .page = NULL,
1214                 .encrypted_page = NULL,
1215                 .compressed_page = NULL,
1216                 .submitted = false,
1217                 .io_type = io_type,
1218                 .io_wbc = wbc,
1219                 .encrypted = fscrypt_inode_uses_fs_layer_crypto(cc->inode),
1220         };
1221         struct dnode_of_data dn;
1222         struct node_info ni;
1223         struct compress_io_ctx *cic;
1224         pgoff_t start_idx = start_idx_of_cluster(cc);
1225         unsigned int last_index = cc->cluster_size - 1;
1226         loff_t psize;
1227         int i, err;
1228
1229         if (IS_NOQUOTA(inode)) {
1230                 /*
1231                  * We need to wait for node_write to avoid block allocation during
1232                  * checkpoint. This can only happen to quota writes which can cause
1233                  * the below discard race condition.
1234                  */
1235                 down_read(&sbi->node_write);
1236         } else if (!f2fs_trylock_op(sbi)) {
1237                 goto out_free;
1238         }
1239
1240         set_new_dnode(&dn, cc->inode, NULL, NULL, 0);
1241
1242         err = f2fs_get_dnode_of_data(&dn, start_idx, LOOKUP_NODE);
1243         if (err)
1244                 goto out_unlock_op;
1245
1246         for (i = 0; i < cc->cluster_size; i++) {
1247                 if (data_blkaddr(dn.inode, dn.node_page,
1248                                         dn.ofs_in_node + i) == NULL_ADDR)
1249                         goto out_put_dnode;
1250         }
1251
1252         psize = (loff_t)(cc->rpages[last_index]->index + 1) << PAGE_SHIFT;
1253
1254         err = f2fs_get_node_info(fio.sbi, dn.nid, &ni);
1255         if (err)
1256                 goto out_put_dnode;
1257
1258         fio.version = ni.version;
1259
1260         cic = kmem_cache_zalloc(cic_entry_slab, GFP_NOFS);
1261         if (!cic)
1262                 goto out_put_dnode;
1263
1264         cic->magic = F2FS_COMPRESSED_PAGE_MAGIC;
1265         cic->inode = inode;
1266         atomic_set(&cic->pending_pages, cc->nr_cpages);
1267         cic->rpages = page_array_alloc(cc->inode, cc->cluster_size);
1268         if (!cic->rpages)
1269                 goto out_put_cic;
1270
1271         cic->nr_rpages = cc->cluster_size;
1272
1273         for (i = 0; i < cc->nr_cpages; i++) {
1274                 f2fs_set_compressed_page(cc->cpages[i], inode,
1275                                         cc->rpages[i + 1]->index, cic);
1276                 fio.compressed_page = cc->cpages[i];
1277
1278                 fio.old_blkaddr = data_blkaddr(dn.inode, dn.node_page,
1279                                                 dn.ofs_in_node + i + 1);
1280
1281                 /* wait for GCed page writeback via META_MAPPING */
1282                 f2fs_wait_on_block_writeback(inode, fio.old_blkaddr);
1283
1284                 if (fio.encrypted) {
1285                         fio.page = cc->rpages[i + 1];
1286                         err = f2fs_encrypt_one_page(&fio);
1287                         if (err)
1288                                 goto out_destroy_crypt;
1289                         cc->cpages[i] = fio.encrypted_page;
1290                 }
1291         }
1292
1293         set_cluster_writeback(cc);
1294
1295         for (i = 0; i < cc->cluster_size; i++)
1296                 cic->rpages[i] = cc->rpages[i];
1297
1298         for (i = 0; i < cc->cluster_size; i++, dn.ofs_in_node++) {
1299                 block_t blkaddr;
1300
1301                 blkaddr = f2fs_data_blkaddr(&dn);
1302                 fio.page = cc->rpages[i];
1303                 fio.old_blkaddr = blkaddr;
1304
1305                 /* cluster header */
1306                 if (i == 0) {
1307                         if (blkaddr == COMPRESS_ADDR)
1308                                 fio.compr_blocks++;
1309                         if (__is_valid_data_blkaddr(blkaddr))
1310                                 f2fs_invalidate_blocks(sbi, blkaddr);
1311                         f2fs_update_data_blkaddr(&dn, COMPRESS_ADDR);
1312                         goto unlock_continue;
1313                 }
1314
1315                 if (fio.compr_blocks && __is_valid_data_blkaddr(blkaddr))
1316                         fio.compr_blocks++;
1317
1318                 if (i > cc->nr_cpages) {
1319                         if (__is_valid_data_blkaddr(blkaddr)) {
1320                                 f2fs_invalidate_blocks(sbi, blkaddr);
1321                                 f2fs_update_data_blkaddr(&dn, NEW_ADDR);
1322                         }
1323                         goto unlock_continue;
1324                 }
1325
1326                 f2fs_bug_on(fio.sbi, blkaddr == NULL_ADDR);
1327
1328                 if (fio.encrypted)
1329                         fio.encrypted_page = cc->cpages[i - 1];
1330                 else
1331                         fio.compressed_page = cc->cpages[i - 1];
1332
1333                 cc->cpages[i - 1] = NULL;
1334                 f2fs_outplace_write_data(&dn, &fio);
1335                 (*submitted)++;
1336 unlock_continue:
1337                 inode_dec_dirty_pages(cc->inode);
1338                 unlock_page(fio.page);
1339         }
1340
1341         if (fio.compr_blocks)
1342                 f2fs_i_compr_blocks_update(inode, fio.compr_blocks - 1, false);
1343         f2fs_i_compr_blocks_update(inode, cc->nr_cpages, true);
1344         add_compr_block_stat(inode, cc->nr_cpages);
1345
1346         set_inode_flag(cc->inode, FI_APPEND_WRITE);
1347         if (cc->cluster_idx == 0)
1348                 set_inode_flag(inode, FI_FIRST_BLOCK_WRITTEN);
1349
1350         f2fs_put_dnode(&dn);
1351         if (IS_NOQUOTA(inode))
1352                 up_read(&sbi->node_write);
1353         else
1354                 f2fs_unlock_op(sbi);
1355
1356         spin_lock(&fi->i_size_lock);
1357         if (fi->last_disk_size < psize)
1358                 fi->last_disk_size = psize;
1359         spin_unlock(&fi->i_size_lock);
1360
1361         f2fs_put_rpages(cc);
1362         page_array_free(cc->inode, cc->cpages, cc->nr_cpages);
1363         cc->cpages = NULL;
1364         f2fs_destroy_compress_ctx(cc);
1365         return 0;
1366
1367 out_destroy_crypt:
1368         page_array_free(cc->inode, cic->rpages, cc->cluster_size);
1369
1370         for (--i; i >= 0; i--)
1371                 fscrypt_finalize_bounce_page(&cc->cpages[i]);
1372         for (i = 0; i < cc->nr_cpages; i++) {
1373                 if (!cc->cpages[i])
1374                         continue;
1375                 f2fs_put_page(cc->cpages[i], 1);
1376         }
1377 out_put_cic:
1378         kmem_cache_free(cic_entry_slab, cic);
1379 out_put_dnode:
1380         f2fs_put_dnode(&dn);
1381 out_unlock_op:
1382         if (IS_NOQUOTA(inode))
1383                 up_read(&sbi->node_write);
1384         else
1385                 f2fs_unlock_op(sbi);
1386 out_free:
1387         page_array_free(cc->inode, cc->cpages, cc->nr_cpages);
1388         cc->cpages = NULL;
1389         return -EAGAIN;
1390 }
1391
1392 void f2fs_compress_write_end_io(struct bio *bio, struct page *page)
1393 {
1394         struct f2fs_sb_info *sbi = bio->bi_private;
1395         struct compress_io_ctx *cic =
1396                         (struct compress_io_ctx *)page_private(page);
1397         int i;
1398
1399         if (unlikely(bio->bi_status))
1400                 mapping_set_error(cic->inode->i_mapping, -EIO);
1401
1402         f2fs_compress_free_page(page);
1403
1404         dec_page_count(sbi, F2FS_WB_DATA);
1405
1406         if (atomic_dec_return(&cic->pending_pages))
1407                 return;
1408
1409         for (i = 0; i < cic->nr_rpages; i++) {
1410                 WARN_ON(!cic->rpages[i]);
1411                 clear_cold_data(cic->rpages[i]);
1412                 end_page_writeback(cic->rpages[i]);
1413         }
1414
1415         page_array_free(cic->inode, cic->rpages, cic->nr_rpages);
1416         kmem_cache_free(cic_entry_slab, cic);
1417 }
1418
1419 static int f2fs_write_raw_pages(struct compress_ctx *cc,
1420                                         int *submitted,
1421                                         struct writeback_control *wbc,
1422                                         enum iostat_type io_type)
1423 {
1424         struct address_space *mapping = cc->inode->i_mapping;
1425         int _submitted, compr_blocks, ret;
1426         int i = -1, err = 0;
1427
1428         compr_blocks = f2fs_compressed_blocks(cc);
1429         if (compr_blocks < 0) {
1430                 err = compr_blocks;
1431                 goto out_err;
1432         }
1433
1434         for (i = 0; i < cc->cluster_size; i++) {
1435                 if (!cc->rpages[i])
1436                         continue;
1437 retry_write:
1438                 if (cc->rpages[i]->mapping != mapping) {
1439                         unlock_page(cc->rpages[i]);
1440                         continue;
1441                 }
1442
1443                 BUG_ON(!PageLocked(cc->rpages[i]));
1444
1445                 ret = f2fs_write_single_data_page(cc->rpages[i], &_submitted,
1446                                                 NULL, NULL, wbc, io_type,
1447                                                 compr_blocks, false);
1448                 if (ret) {
1449                         if (ret == AOP_WRITEPAGE_ACTIVATE) {
1450                                 unlock_page(cc->rpages[i]);
1451                                 ret = 0;
1452                         } else if (ret == -EAGAIN) {
1453                                 /*
1454                                  * for quota file, just redirty left pages to
1455                                  * avoid deadlock caused by cluster update race
1456                                  * from foreground operation.
1457                                  */
1458                                 if (IS_NOQUOTA(cc->inode)) {
1459                                         err = 0;
1460                                         goto out_err;
1461                                 }
1462                                 ret = 0;
1463                                 cond_resched();
1464                                 congestion_wait(BLK_RW_ASYNC,
1465                                                 DEFAULT_IO_TIMEOUT);
1466                                 lock_page(cc->rpages[i]);
1467
1468                                 if (!PageDirty(cc->rpages[i])) {
1469                                         unlock_page(cc->rpages[i]);
1470                                         continue;
1471                                 }
1472
1473                                 clear_page_dirty_for_io(cc->rpages[i]);
1474                                 goto retry_write;
1475                         }
1476                         err = ret;
1477                         goto out_err;
1478                 }
1479
1480                 *submitted += _submitted;
1481         }
1482
1483         f2fs_balance_fs(F2FS_M_SB(mapping), true);
1484
1485         return 0;
1486 out_err:
1487         for (++i; i < cc->cluster_size; i++) {
1488                 if (!cc->rpages[i])
1489                         continue;
1490                 redirty_page_for_writepage(wbc, cc->rpages[i]);
1491                 unlock_page(cc->rpages[i]);
1492         }
1493         return err;
1494 }
1495
1496 int f2fs_write_multi_pages(struct compress_ctx *cc,
1497                                         int *submitted,
1498                                         struct writeback_control *wbc,
1499                                         enum iostat_type io_type)
1500 {
1501         int err;
1502
1503         *submitted = 0;
1504         if (cluster_may_compress(cc)) {
1505                 err = f2fs_compress_pages(cc);
1506                 if (err == -EAGAIN) {
1507                         goto write;
1508                 } else if (err) {
1509                         f2fs_put_rpages_wbc(cc, wbc, true, 1);
1510                         goto destroy_out;
1511                 }
1512
1513                 err = f2fs_write_compressed_pages(cc, submitted,
1514                                                         wbc, io_type);
1515                 if (!err)
1516                         return 0;
1517                 f2fs_bug_on(F2FS_I_SB(cc->inode), err != -EAGAIN);
1518         }
1519 write:
1520         f2fs_bug_on(F2FS_I_SB(cc->inode), *submitted);
1521
1522         err = f2fs_write_raw_pages(cc, submitted, wbc, io_type);
1523         f2fs_put_rpages_wbc(cc, wbc, false, 0);
1524 destroy_out:
1525         f2fs_destroy_compress_ctx(cc);
1526         return err;
1527 }
1528
1529 static void f2fs_free_dic(struct decompress_io_ctx *dic);
1530
1531 struct decompress_io_ctx *f2fs_alloc_dic(struct compress_ctx *cc)
1532 {
1533         struct decompress_io_ctx *dic;
1534         pgoff_t start_idx = start_idx_of_cluster(cc);
1535         int i;
1536
1537         dic = kmem_cache_zalloc(dic_entry_slab, GFP_NOFS);
1538         if (!dic)
1539                 return ERR_PTR(-ENOMEM);
1540
1541         dic->rpages = page_array_alloc(cc->inode, cc->cluster_size);
1542         if (!dic->rpages) {
1543                 kmem_cache_free(dic_entry_slab, dic);
1544                 return ERR_PTR(-ENOMEM);
1545         }
1546
1547         dic->magic = F2FS_COMPRESSED_PAGE_MAGIC;
1548         dic->inode = cc->inode;
1549         atomic_set(&dic->remaining_pages, cc->nr_cpages);
1550         dic->cluster_idx = cc->cluster_idx;
1551         dic->cluster_size = cc->cluster_size;
1552         dic->log_cluster_size = cc->log_cluster_size;
1553         dic->nr_cpages = cc->nr_cpages;
1554         refcount_set(&dic->refcnt, 1);
1555         dic->failed = false;
1556         dic->need_verity = f2fs_need_verity(cc->inode, start_idx);
1557
1558         for (i = 0; i < dic->cluster_size; i++)
1559                 dic->rpages[i] = cc->rpages[i];
1560         dic->nr_rpages = cc->cluster_size;
1561
1562         dic->cpages = page_array_alloc(dic->inode, dic->nr_cpages);
1563         if (!dic->cpages)
1564                 goto out_free;
1565
1566         for (i = 0; i < dic->nr_cpages; i++) {
1567                 struct page *page;
1568
1569                 page = f2fs_compress_alloc_page();
1570                 if (!page)
1571                         goto out_free;
1572
1573                 f2fs_set_compressed_page(page, cc->inode,
1574                                         start_idx + i + 1, dic);
1575                 dic->cpages[i] = page;
1576         }
1577
1578         return dic;
1579
1580 out_free:
1581         f2fs_free_dic(dic);
1582         return ERR_PTR(-ENOMEM);
1583 }
1584
1585 static void f2fs_free_dic(struct decompress_io_ctx *dic)
1586 {
1587         int i;
1588
1589         if (dic->tpages) {
1590                 for (i = 0; i < dic->cluster_size; i++) {
1591                         if (dic->rpages[i])
1592                                 continue;
1593                         if (!dic->tpages[i])
1594                                 continue;
1595                         f2fs_compress_free_page(dic->tpages[i]);
1596                 }
1597                 page_array_free(dic->inode, dic->tpages, dic->cluster_size);
1598         }
1599
1600         if (dic->cpages) {
1601                 for (i = 0; i < dic->nr_cpages; i++) {
1602                         if (!dic->cpages[i])
1603                                 continue;
1604                         f2fs_compress_free_page(dic->cpages[i]);
1605                 }
1606                 page_array_free(dic->inode, dic->cpages, dic->nr_cpages);
1607         }
1608
1609         page_array_free(dic->inode, dic->rpages, dic->nr_rpages);
1610         kmem_cache_free(dic_entry_slab, dic);
1611 }
1612
1613 static void f2fs_put_dic(struct decompress_io_ctx *dic)
1614 {
1615         if (refcount_dec_and_test(&dic->refcnt))
1616                 f2fs_free_dic(dic);
1617 }
1618
1619 /*
1620  * Update and unlock the cluster's pagecache pages, and release the reference to
1621  * the decompress_io_ctx that was being held for I/O completion.
1622  */
1623 static void __f2fs_decompress_end_io(struct decompress_io_ctx *dic, bool failed)
1624 {
1625         int i;
1626
1627         for (i = 0; i < dic->cluster_size; i++) {
1628                 struct page *rpage = dic->rpages[i];
1629
1630                 if (!rpage)
1631                         continue;
1632
1633                 /* PG_error was set if verity failed. */
1634                 if (failed || PageError(rpage)) {
1635                         ClearPageUptodate(rpage);
1636                         /* will re-read again later */
1637                         ClearPageError(rpage);
1638                 } else {
1639                         SetPageUptodate(rpage);
1640                 }
1641                 unlock_page(rpage);
1642         }
1643
1644         f2fs_put_dic(dic);
1645 }
1646
1647 static void f2fs_verify_cluster(struct work_struct *work)
1648 {
1649         struct decompress_io_ctx *dic =
1650                 container_of(work, struct decompress_io_ctx, verity_work);
1651         int i;
1652
1653         /* Verify the cluster's decompressed pages with fs-verity. */
1654         for (i = 0; i < dic->cluster_size; i++) {
1655                 struct page *rpage = dic->rpages[i];
1656
1657                 if (rpage && !fsverity_verify_page(rpage))
1658                         SetPageError(rpage);
1659         }
1660
1661         __f2fs_decompress_end_io(dic, false);
1662 }
1663
1664 /*
1665  * This is called when a compressed cluster has been decompressed
1666  * (or failed to be read and/or decompressed).
1667  */
1668 void f2fs_decompress_end_io(struct decompress_io_ctx *dic, bool failed)
1669 {
1670         if (!failed && dic->need_verity) {
1671                 /*
1672                  * Note that to avoid deadlocks, the verity work can't be done
1673                  * on the decompression workqueue.  This is because verifying
1674                  * the data pages can involve reading metadata pages from the
1675                  * file, and these metadata pages may be compressed.
1676                  */
1677                 INIT_WORK(&dic->verity_work, f2fs_verify_cluster);
1678                 fsverity_enqueue_verify_work(&dic->verity_work);
1679         } else {
1680                 __f2fs_decompress_end_io(dic, failed);
1681         }
1682 }
1683
1684 /*
1685  * Put a reference to a compressed page's decompress_io_ctx.
1686  *
1687  * This is called when the page is no longer needed and can be freed.
1688  */
1689 void f2fs_put_page_dic(struct page *page)
1690 {
1691         struct decompress_io_ctx *dic =
1692                         (struct decompress_io_ctx *)page_private(page);
1693
1694         f2fs_put_dic(dic);
1695 }
1696
1697 int f2fs_init_page_array_cache(struct f2fs_sb_info *sbi)
1698 {
1699         dev_t dev = sbi->sb->s_bdev->bd_dev;
1700         char slab_name[32];
1701
1702         sprintf(slab_name, "f2fs_page_array_entry-%u:%u", MAJOR(dev), MINOR(dev));
1703
1704         sbi->page_array_slab_size = sizeof(struct page *) <<
1705                                         F2FS_OPTION(sbi).compress_log_size;
1706
1707         sbi->page_array_slab = f2fs_kmem_cache_create(slab_name,
1708                                         sbi->page_array_slab_size);
1709         if (!sbi->page_array_slab)
1710                 return -ENOMEM;
1711         return 0;
1712 }
1713
1714 void f2fs_destroy_page_array_cache(struct f2fs_sb_info *sbi)
1715 {
1716         kmem_cache_destroy(sbi->page_array_slab);
1717 }
1718
1719 static int __init f2fs_init_cic_cache(void)
1720 {
1721         cic_entry_slab = f2fs_kmem_cache_create("f2fs_cic_entry",
1722                                         sizeof(struct compress_io_ctx));
1723         if (!cic_entry_slab)
1724                 return -ENOMEM;
1725         return 0;
1726 }
1727
1728 static void f2fs_destroy_cic_cache(void)
1729 {
1730         kmem_cache_destroy(cic_entry_slab);
1731 }
1732
1733 static int __init f2fs_init_dic_cache(void)
1734 {
1735         dic_entry_slab = f2fs_kmem_cache_create("f2fs_dic_entry",
1736                                         sizeof(struct decompress_io_ctx));
1737         if (!dic_entry_slab)
1738                 return -ENOMEM;
1739         return 0;
1740 }
1741
1742 static void f2fs_destroy_dic_cache(void)
1743 {
1744         kmem_cache_destroy(dic_entry_slab);
1745 }
1746
1747 int __init f2fs_init_compress_cache(void)
1748 {
1749         int err;
1750
1751         err = f2fs_init_cic_cache();
1752         if (err)
1753                 goto out;
1754         err = f2fs_init_dic_cache();
1755         if (err)
1756                 goto free_cic;
1757         return 0;
1758 free_cic:
1759         f2fs_destroy_cic_cache();
1760 out:
1761         return -ENOMEM;
1762 }
1763
1764 void f2fs_destroy_compress_cache(void)
1765 {
1766         f2fs_destroy_dic_cache();
1767         f2fs_destroy_cic_cache();
1768 }