Merge tag 'for-linus' of git://git.kernel.org/pub/scm/virt/kvm/kvm
[linux-2.6-microblaze.git] / fs / f2fs / compress.c
1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  * f2fs compress support
4  *
5  * Copyright (c) 2019 Chao Yu <chao@kernel.org>
6  */
7
8 #include <linux/fs.h>
9 #include <linux/f2fs_fs.h>
10 #include <linux/writeback.h>
11 #include <linux/backing-dev.h>
12 #include <linux/lzo.h>
13 #include <linux/lz4.h>
14 #include <linux/zstd.h>
15
16 #include "f2fs.h"
17 #include "node.h"
18 #include <trace/events/f2fs.h>
19
20 static struct kmem_cache *cic_entry_slab;
21 static struct kmem_cache *dic_entry_slab;
22
23 static void *page_array_alloc(struct inode *inode, int nr)
24 {
25         struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
26         unsigned int size = sizeof(struct page *) * nr;
27
28         if (likely(size <= sbi->page_array_slab_size))
29                 return kmem_cache_zalloc(sbi->page_array_slab, GFP_NOFS);
30         return f2fs_kzalloc(sbi, size, GFP_NOFS);
31 }
32
33 static void page_array_free(struct inode *inode, void *pages, int nr)
34 {
35         struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
36         unsigned int size = sizeof(struct page *) * nr;
37
38         if (!pages)
39                 return;
40
41         if (likely(size <= sbi->page_array_slab_size))
42                 kmem_cache_free(sbi->page_array_slab, pages);
43         else
44                 kfree(pages);
45 }
46
47 struct f2fs_compress_ops {
48         int (*init_compress_ctx)(struct compress_ctx *cc);
49         void (*destroy_compress_ctx)(struct compress_ctx *cc);
50         int (*compress_pages)(struct compress_ctx *cc);
51         int (*init_decompress_ctx)(struct decompress_io_ctx *dic);
52         void (*destroy_decompress_ctx)(struct decompress_io_ctx *dic);
53         int (*decompress_pages)(struct decompress_io_ctx *dic);
54 };
55
56 static unsigned int offset_in_cluster(struct compress_ctx *cc, pgoff_t index)
57 {
58         return index & (cc->cluster_size - 1);
59 }
60
61 static pgoff_t cluster_idx(struct compress_ctx *cc, pgoff_t index)
62 {
63         return index >> cc->log_cluster_size;
64 }
65
66 static pgoff_t start_idx_of_cluster(struct compress_ctx *cc)
67 {
68         return cc->cluster_idx << cc->log_cluster_size;
69 }
70
71 bool f2fs_is_compressed_page(struct page *page)
72 {
73         if (!PagePrivate(page))
74                 return false;
75         if (!page_private(page))
76                 return false;
77         if (IS_ATOMIC_WRITTEN_PAGE(page) || IS_DUMMY_WRITTEN_PAGE(page))
78                 return false;
79         /*
80          * page->private may be set with pid.
81          * pid_max is enough to check if it is traced.
82          */
83         if (IS_IO_TRACED_PAGE(page))
84                 return false;
85
86         f2fs_bug_on(F2FS_M_SB(page->mapping),
87                 *((u32 *)page_private(page)) != F2FS_COMPRESSED_PAGE_MAGIC);
88         return true;
89 }
90
91 static void f2fs_set_compressed_page(struct page *page,
92                 struct inode *inode, pgoff_t index, void *data)
93 {
94         SetPagePrivate(page);
95         set_page_private(page, (unsigned long)data);
96
97         /* i_crypto_info and iv index */
98         page->index = index;
99         page->mapping = inode->i_mapping;
100 }
101
102 static void f2fs_drop_rpages(struct compress_ctx *cc, int len, bool unlock)
103 {
104         int i;
105
106         for (i = 0; i < len; i++) {
107                 if (!cc->rpages[i])
108                         continue;
109                 if (unlock)
110                         unlock_page(cc->rpages[i]);
111                 else
112                         put_page(cc->rpages[i]);
113         }
114 }
115
116 static void f2fs_put_rpages(struct compress_ctx *cc)
117 {
118         f2fs_drop_rpages(cc, cc->cluster_size, false);
119 }
120
121 static void f2fs_unlock_rpages(struct compress_ctx *cc, int len)
122 {
123         f2fs_drop_rpages(cc, len, true);
124 }
125
126 static void f2fs_put_rpages_mapping(struct address_space *mapping,
127                                 pgoff_t start, int len)
128 {
129         int i;
130
131         for (i = 0; i < len; i++) {
132                 struct page *page = find_get_page(mapping, start + i);
133
134                 put_page(page);
135                 put_page(page);
136         }
137 }
138
139 static void f2fs_put_rpages_wbc(struct compress_ctx *cc,
140                 struct writeback_control *wbc, bool redirty, int unlock)
141 {
142         unsigned int i;
143
144         for (i = 0; i < cc->cluster_size; i++) {
145                 if (!cc->rpages[i])
146                         continue;
147                 if (redirty)
148                         redirty_page_for_writepage(wbc, cc->rpages[i]);
149                 f2fs_put_page(cc->rpages[i], unlock);
150         }
151 }
152
153 struct page *f2fs_compress_control_page(struct page *page)
154 {
155         return ((struct compress_io_ctx *)page_private(page))->rpages[0];
156 }
157
158 int f2fs_init_compress_ctx(struct compress_ctx *cc)
159 {
160         if (cc->rpages)
161                 return 0;
162
163         cc->rpages = page_array_alloc(cc->inode, cc->cluster_size);
164         return cc->rpages ? 0 : -ENOMEM;
165 }
166
167 void f2fs_destroy_compress_ctx(struct compress_ctx *cc)
168 {
169         page_array_free(cc->inode, cc->rpages, cc->cluster_size);
170         cc->rpages = NULL;
171         cc->nr_rpages = 0;
172         cc->nr_cpages = 0;
173         cc->cluster_idx = NULL_CLUSTER;
174 }
175
176 void f2fs_compress_ctx_add_page(struct compress_ctx *cc, struct page *page)
177 {
178         unsigned int cluster_ofs;
179
180         if (!f2fs_cluster_can_merge_page(cc, page->index))
181                 f2fs_bug_on(F2FS_I_SB(cc->inode), 1);
182
183         cluster_ofs = offset_in_cluster(cc, page->index);
184         cc->rpages[cluster_ofs] = page;
185         cc->nr_rpages++;
186         cc->cluster_idx = cluster_idx(cc, page->index);
187 }
188
189 #ifdef CONFIG_F2FS_FS_LZO
190 static int lzo_init_compress_ctx(struct compress_ctx *cc)
191 {
192         cc->private = f2fs_kvmalloc(F2FS_I_SB(cc->inode),
193                                 LZO1X_MEM_COMPRESS, GFP_NOFS);
194         if (!cc->private)
195                 return -ENOMEM;
196
197         cc->clen = lzo1x_worst_compress(PAGE_SIZE << cc->log_cluster_size);
198         return 0;
199 }
200
201 static void lzo_destroy_compress_ctx(struct compress_ctx *cc)
202 {
203         kvfree(cc->private);
204         cc->private = NULL;
205 }
206
207 static int lzo_compress_pages(struct compress_ctx *cc)
208 {
209         int ret;
210
211         ret = lzo1x_1_compress(cc->rbuf, cc->rlen, cc->cbuf->cdata,
212                                         &cc->clen, cc->private);
213         if (ret != LZO_E_OK) {
214                 printk_ratelimited("%sF2FS-fs (%s): lzo compress failed, ret:%d\n",
215                                 KERN_ERR, F2FS_I_SB(cc->inode)->sb->s_id, ret);
216                 return -EIO;
217         }
218         return 0;
219 }
220
221 static int lzo_decompress_pages(struct decompress_io_ctx *dic)
222 {
223         int ret;
224
225         ret = lzo1x_decompress_safe(dic->cbuf->cdata, dic->clen,
226                                                 dic->rbuf, &dic->rlen);
227         if (ret != LZO_E_OK) {
228                 printk_ratelimited("%sF2FS-fs (%s): lzo decompress failed, ret:%d\n",
229                                 KERN_ERR, F2FS_I_SB(dic->inode)->sb->s_id, ret);
230                 return -EIO;
231         }
232
233         if (dic->rlen != PAGE_SIZE << dic->log_cluster_size) {
234                 printk_ratelimited("%sF2FS-fs (%s): lzo invalid rlen:%zu, "
235                                         "expected:%lu\n", KERN_ERR,
236                                         F2FS_I_SB(dic->inode)->sb->s_id,
237                                         dic->rlen,
238                                         PAGE_SIZE << dic->log_cluster_size);
239                 return -EIO;
240         }
241         return 0;
242 }
243
244 static const struct f2fs_compress_ops f2fs_lzo_ops = {
245         .init_compress_ctx      = lzo_init_compress_ctx,
246         .destroy_compress_ctx   = lzo_destroy_compress_ctx,
247         .compress_pages         = lzo_compress_pages,
248         .decompress_pages       = lzo_decompress_pages,
249 };
250 #endif
251
252 #ifdef CONFIG_F2FS_FS_LZ4
253 static int lz4_init_compress_ctx(struct compress_ctx *cc)
254 {
255         unsigned int size = LZ4_MEM_COMPRESS;
256
257 #ifdef CONFIG_F2FS_FS_LZ4HC
258         if (F2FS_I(cc->inode)->i_compress_flag >> COMPRESS_LEVEL_OFFSET)
259                 size = LZ4HC_MEM_COMPRESS;
260 #endif
261
262         cc->private = f2fs_kvmalloc(F2FS_I_SB(cc->inode), size, GFP_NOFS);
263         if (!cc->private)
264                 return -ENOMEM;
265
266         /*
267          * we do not change cc->clen to LZ4_compressBound(inputsize) to
268          * adapt worst compress case, because lz4 compressor can handle
269          * output budget properly.
270          */
271         cc->clen = cc->rlen - PAGE_SIZE - COMPRESS_HEADER_SIZE;
272         return 0;
273 }
274
275 static void lz4_destroy_compress_ctx(struct compress_ctx *cc)
276 {
277         kvfree(cc->private);
278         cc->private = NULL;
279 }
280
281 #ifdef CONFIG_F2FS_FS_LZ4HC
282 static int lz4hc_compress_pages(struct compress_ctx *cc)
283 {
284         unsigned char level = F2FS_I(cc->inode)->i_compress_flag >>
285                                                 COMPRESS_LEVEL_OFFSET;
286         int len;
287
288         if (level)
289                 len = LZ4_compress_HC(cc->rbuf, cc->cbuf->cdata, cc->rlen,
290                                         cc->clen, level, cc->private);
291         else
292                 len = LZ4_compress_default(cc->rbuf, cc->cbuf->cdata, cc->rlen,
293                                                 cc->clen, cc->private);
294         if (!len)
295                 return -EAGAIN;
296
297         cc->clen = len;
298         return 0;
299 }
300 #endif
301
302 static int lz4_compress_pages(struct compress_ctx *cc)
303 {
304         int len;
305
306 #ifdef CONFIG_F2FS_FS_LZ4HC
307         return lz4hc_compress_pages(cc);
308 #endif
309         len = LZ4_compress_default(cc->rbuf, cc->cbuf->cdata, cc->rlen,
310                                                 cc->clen, cc->private);
311         if (!len)
312                 return -EAGAIN;
313
314         cc->clen = len;
315         return 0;
316 }
317
318 static int lz4_decompress_pages(struct decompress_io_ctx *dic)
319 {
320         int ret;
321
322         ret = LZ4_decompress_safe(dic->cbuf->cdata, dic->rbuf,
323                                                 dic->clen, dic->rlen);
324         if (ret < 0) {
325                 printk_ratelimited("%sF2FS-fs (%s): lz4 decompress failed, ret:%d\n",
326                                 KERN_ERR, F2FS_I_SB(dic->inode)->sb->s_id, ret);
327                 return -EIO;
328         }
329
330         if (ret != PAGE_SIZE << dic->log_cluster_size) {
331                 printk_ratelimited("%sF2FS-fs (%s): lz4 invalid rlen:%zu, "
332                                         "expected:%lu\n", KERN_ERR,
333                                         F2FS_I_SB(dic->inode)->sb->s_id,
334                                         dic->rlen,
335                                         PAGE_SIZE << dic->log_cluster_size);
336                 return -EIO;
337         }
338         return 0;
339 }
340
341 static const struct f2fs_compress_ops f2fs_lz4_ops = {
342         .init_compress_ctx      = lz4_init_compress_ctx,
343         .destroy_compress_ctx   = lz4_destroy_compress_ctx,
344         .compress_pages         = lz4_compress_pages,
345         .decompress_pages       = lz4_decompress_pages,
346 };
347 #endif
348
349 #ifdef CONFIG_F2FS_FS_ZSTD
350 #define F2FS_ZSTD_DEFAULT_CLEVEL        1
351
352 static int zstd_init_compress_ctx(struct compress_ctx *cc)
353 {
354         ZSTD_parameters params;
355         ZSTD_CStream *stream;
356         void *workspace;
357         unsigned int workspace_size;
358         unsigned char level = F2FS_I(cc->inode)->i_compress_flag >>
359                                                 COMPRESS_LEVEL_OFFSET;
360
361         if (!level)
362                 level = F2FS_ZSTD_DEFAULT_CLEVEL;
363
364         params = ZSTD_getParams(level, cc->rlen, 0);
365         workspace_size = ZSTD_CStreamWorkspaceBound(params.cParams);
366
367         workspace = f2fs_kvmalloc(F2FS_I_SB(cc->inode),
368                                         workspace_size, GFP_NOFS);
369         if (!workspace)
370                 return -ENOMEM;
371
372         stream = ZSTD_initCStream(params, 0, workspace, workspace_size);
373         if (!stream) {
374                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD_initCStream failed\n",
375                                 KERN_ERR, F2FS_I_SB(cc->inode)->sb->s_id,
376                                 __func__);
377                 kvfree(workspace);
378                 return -EIO;
379         }
380
381         cc->private = workspace;
382         cc->private2 = stream;
383
384         cc->clen = cc->rlen - PAGE_SIZE - COMPRESS_HEADER_SIZE;
385         return 0;
386 }
387
388 static void zstd_destroy_compress_ctx(struct compress_ctx *cc)
389 {
390         kvfree(cc->private);
391         cc->private = NULL;
392         cc->private2 = NULL;
393 }
394
395 static int zstd_compress_pages(struct compress_ctx *cc)
396 {
397         ZSTD_CStream *stream = cc->private2;
398         ZSTD_inBuffer inbuf;
399         ZSTD_outBuffer outbuf;
400         int src_size = cc->rlen;
401         int dst_size = src_size - PAGE_SIZE - COMPRESS_HEADER_SIZE;
402         int ret;
403
404         inbuf.pos = 0;
405         inbuf.src = cc->rbuf;
406         inbuf.size = src_size;
407
408         outbuf.pos = 0;
409         outbuf.dst = cc->cbuf->cdata;
410         outbuf.size = dst_size;
411
412         ret = ZSTD_compressStream(stream, &outbuf, &inbuf);
413         if (ZSTD_isError(ret)) {
414                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD_compressStream failed, ret: %d\n",
415                                 KERN_ERR, F2FS_I_SB(cc->inode)->sb->s_id,
416                                 __func__, ZSTD_getErrorCode(ret));
417                 return -EIO;
418         }
419
420         ret = ZSTD_endStream(stream, &outbuf);
421         if (ZSTD_isError(ret)) {
422                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD_endStream returned %d\n",
423                                 KERN_ERR, F2FS_I_SB(cc->inode)->sb->s_id,
424                                 __func__, ZSTD_getErrorCode(ret));
425                 return -EIO;
426         }
427
428         /*
429          * there is compressed data remained in intermediate buffer due to
430          * no more space in cbuf.cdata
431          */
432         if (ret)
433                 return -EAGAIN;
434
435         cc->clen = outbuf.pos;
436         return 0;
437 }
438
439 static int zstd_init_decompress_ctx(struct decompress_io_ctx *dic)
440 {
441         ZSTD_DStream *stream;
442         void *workspace;
443         unsigned int workspace_size;
444         unsigned int max_window_size =
445                         MAX_COMPRESS_WINDOW_SIZE(dic->log_cluster_size);
446
447         workspace_size = ZSTD_DStreamWorkspaceBound(max_window_size);
448
449         workspace = f2fs_kvmalloc(F2FS_I_SB(dic->inode),
450                                         workspace_size, GFP_NOFS);
451         if (!workspace)
452                 return -ENOMEM;
453
454         stream = ZSTD_initDStream(max_window_size, workspace, workspace_size);
455         if (!stream) {
456                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD_initDStream failed\n",
457                                 KERN_ERR, F2FS_I_SB(dic->inode)->sb->s_id,
458                                 __func__);
459                 kvfree(workspace);
460                 return -EIO;
461         }
462
463         dic->private = workspace;
464         dic->private2 = stream;
465
466         return 0;
467 }
468
469 static void zstd_destroy_decompress_ctx(struct decompress_io_ctx *dic)
470 {
471         kvfree(dic->private);
472         dic->private = NULL;
473         dic->private2 = NULL;
474 }
475
476 static int zstd_decompress_pages(struct decompress_io_ctx *dic)
477 {
478         ZSTD_DStream *stream = dic->private2;
479         ZSTD_inBuffer inbuf;
480         ZSTD_outBuffer outbuf;
481         int ret;
482
483         inbuf.pos = 0;
484         inbuf.src = dic->cbuf->cdata;
485         inbuf.size = dic->clen;
486
487         outbuf.pos = 0;
488         outbuf.dst = dic->rbuf;
489         outbuf.size = dic->rlen;
490
491         ret = ZSTD_decompressStream(stream, &outbuf, &inbuf);
492         if (ZSTD_isError(ret)) {
493                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD_compressStream failed, ret: %d\n",
494                                 KERN_ERR, F2FS_I_SB(dic->inode)->sb->s_id,
495                                 __func__, ZSTD_getErrorCode(ret));
496                 return -EIO;
497         }
498
499         if (dic->rlen != outbuf.pos) {
500                 printk_ratelimited("%sF2FS-fs (%s): %s ZSTD invalid rlen:%zu, "
501                                 "expected:%lu\n", KERN_ERR,
502                                 F2FS_I_SB(dic->inode)->sb->s_id,
503                                 __func__, dic->rlen,
504                                 PAGE_SIZE << dic->log_cluster_size);
505                 return -EIO;
506         }
507
508         return 0;
509 }
510
511 static const struct f2fs_compress_ops f2fs_zstd_ops = {
512         .init_compress_ctx      = zstd_init_compress_ctx,
513         .destroy_compress_ctx   = zstd_destroy_compress_ctx,
514         .compress_pages         = zstd_compress_pages,
515         .init_decompress_ctx    = zstd_init_decompress_ctx,
516         .destroy_decompress_ctx = zstd_destroy_decompress_ctx,
517         .decompress_pages       = zstd_decompress_pages,
518 };
519 #endif
520
521 #ifdef CONFIG_F2FS_FS_LZO
522 #ifdef CONFIG_F2FS_FS_LZORLE
523 static int lzorle_compress_pages(struct compress_ctx *cc)
524 {
525         int ret;
526
527         ret = lzorle1x_1_compress(cc->rbuf, cc->rlen, cc->cbuf->cdata,
528                                         &cc->clen, cc->private);
529         if (ret != LZO_E_OK) {
530                 printk_ratelimited("%sF2FS-fs (%s): lzo-rle compress failed, ret:%d\n",
531                                 KERN_ERR, F2FS_I_SB(cc->inode)->sb->s_id, ret);
532                 return -EIO;
533         }
534         return 0;
535 }
536
537 static const struct f2fs_compress_ops f2fs_lzorle_ops = {
538         .init_compress_ctx      = lzo_init_compress_ctx,
539         .destroy_compress_ctx   = lzo_destroy_compress_ctx,
540         .compress_pages         = lzorle_compress_pages,
541         .decompress_pages       = lzo_decompress_pages,
542 };
543 #endif
544 #endif
545
546 static const struct f2fs_compress_ops *f2fs_cops[COMPRESS_MAX] = {
547 #ifdef CONFIG_F2FS_FS_LZO
548         &f2fs_lzo_ops,
549 #else
550         NULL,
551 #endif
552 #ifdef CONFIG_F2FS_FS_LZ4
553         &f2fs_lz4_ops,
554 #else
555         NULL,
556 #endif
557 #ifdef CONFIG_F2FS_FS_ZSTD
558         &f2fs_zstd_ops,
559 #else
560         NULL,
561 #endif
562 #if defined(CONFIG_F2FS_FS_LZO) && defined(CONFIG_F2FS_FS_LZORLE)
563         &f2fs_lzorle_ops,
564 #else
565         NULL,
566 #endif
567 };
568
569 bool f2fs_is_compress_backend_ready(struct inode *inode)
570 {
571         if (!f2fs_compressed_file(inode))
572                 return true;
573         return f2fs_cops[F2FS_I(inode)->i_compress_algorithm];
574 }
575
576 static mempool_t *compress_page_pool;
577 static int num_compress_pages = 512;
578 module_param(num_compress_pages, uint, 0444);
579 MODULE_PARM_DESC(num_compress_pages,
580                 "Number of intermediate compress pages to preallocate");
581
582 int f2fs_init_compress_mempool(void)
583 {
584         compress_page_pool = mempool_create_page_pool(num_compress_pages, 0);
585         if (!compress_page_pool)
586                 return -ENOMEM;
587
588         return 0;
589 }
590
591 void f2fs_destroy_compress_mempool(void)
592 {
593         mempool_destroy(compress_page_pool);
594 }
595
596 static struct page *f2fs_compress_alloc_page(void)
597 {
598         struct page *page;
599
600         page = mempool_alloc(compress_page_pool, GFP_NOFS);
601         lock_page(page);
602
603         return page;
604 }
605
606 static void f2fs_compress_free_page(struct page *page)
607 {
608         if (!page)
609                 return;
610         set_page_private(page, (unsigned long)NULL);
611         ClearPagePrivate(page);
612         page->mapping = NULL;
613         unlock_page(page);
614         mempool_free(page, compress_page_pool);
615 }
616
617 #define MAX_VMAP_RETRIES        3
618
619 static void *f2fs_vmap(struct page **pages, unsigned int count)
620 {
621         int i;
622         void *buf = NULL;
623
624         for (i = 0; i < MAX_VMAP_RETRIES; i++) {
625                 buf = vm_map_ram(pages, count, -1);
626                 if (buf)
627                         break;
628                 vm_unmap_aliases();
629         }
630         return buf;
631 }
632
633 static int f2fs_compress_pages(struct compress_ctx *cc)
634 {
635         struct f2fs_inode_info *fi = F2FS_I(cc->inode);
636         const struct f2fs_compress_ops *cops =
637                                 f2fs_cops[fi->i_compress_algorithm];
638         unsigned int max_len, new_nr_cpages;
639         struct page **new_cpages;
640         u32 chksum = 0;
641         int i, ret;
642
643         trace_f2fs_compress_pages_start(cc->inode, cc->cluster_idx,
644                                 cc->cluster_size, fi->i_compress_algorithm);
645
646         if (cops->init_compress_ctx) {
647                 ret = cops->init_compress_ctx(cc);
648                 if (ret)
649                         goto out;
650         }
651
652         max_len = COMPRESS_HEADER_SIZE + cc->clen;
653         cc->nr_cpages = DIV_ROUND_UP(max_len, PAGE_SIZE);
654
655         cc->cpages = page_array_alloc(cc->inode, cc->nr_cpages);
656         if (!cc->cpages) {
657                 ret = -ENOMEM;
658                 goto destroy_compress_ctx;
659         }
660
661         for (i = 0; i < cc->nr_cpages; i++) {
662                 cc->cpages[i] = f2fs_compress_alloc_page();
663                 if (!cc->cpages[i]) {
664                         ret = -ENOMEM;
665                         goto out_free_cpages;
666                 }
667         }
668
669         cc->rbuf = f2fs_vmap(cc->rpages, cc->cluster_size);
670         if (!cc->rbuf) {
671                 ret = -ENOMEM;
672                 goto out_free_cpages;
673         }
674
675         cc->cbuf = f2fs_vmap(cc->cpages, cc->nr_cpages);
676         if (!cc->cbuf) {
677                 ret = -ENOMEM;
678                 goto out_vunmap_rbuf;
679         }
680
681         ret = cops->compress_pages(cc);
682         if (ret)
683                 goto out_vunmap_cbuf;
684
685         max_len = PAGE_SIZE * (cc->cluster_size - 1) - COMPRESS_HEADER_SIZE;
686
687         if (cc->clen > max_len) {
688                 ret = -EAGAIN;
689                 goto out_vunmap_cbuf;
690         }
691
692         cc->cbuf->clen = cpu_to_le32(cc->clen);
693
694         if (fi->i_compress_flag & 1 << COMPRESS_CHKSUM)
695                 chksum = f2fs_crc32(F2FS_I_SB(cc->inode),
696                                         cc->cbuf->cdata, cc->clen);
697         cc->cbuf->chksum = cpu_to_le32(chksum);
698
699         for (i = 0; i < COMPRESS_DATA_RESERVED_SIZE; i++)
700                 cc->cbuf->reserved[i] = cpu_to_le32(0);
701
702         new_nr_cpages = DIV_ROUND_UP(cc->clen + COMPRESS_HEADER_SIZE, PAGE_SIZE);
703
704         /* Now we're going to cut unnecessary tail pages */
705         new_cpages = page_array_alloc(cc->inode, new_nr_cpages);
706         if (!new_cpages) {
707                 ret = -ENOMEM;
708                 goto out_vunmap_cbuf;
709         }
710
711         /* zero out any unused part of the last page */
712         memset(&cc->cbuf->cdata[cc->clen], 0,
713                         (new_nr_cpages * PAGE_SIZE) -
714                         (cc->clen + COMPRESS_HEADER_SIZE));
715
716         vm_unmap_ram(cc->cbuf, cc->nr_cpages);
717         vm_unmap_ram(cc->rbuf, cc->cluster_size);
718
719         for (i = 0; i < cc->nr_cpages; i++) {
720                 if (i < new_nr_cpages) {
721                         new_cpages[i] = cc->cpages[i];
722                         continue;
723                 }
724                 f2fs_compress_free_page(cc->cpages[i]);
725                 cc->cpages[i] = NULL;
726         }
727
728         if (cops->destroy_compress_ctx)
729                 cops->destroy_compress_ctx(cc);
730
731         page_array_free(cc->inode, cc->cpages, cc->nr_cpages);
732         cc->cpages = new_cpages;
733         cc->nr_cpages = new_nr_cpages;
734
735         trace_f2fs_compress_pages_end(cc->inode, cc->cluster_idx,
736                                                         cc->clen, ret);
737         return 0;
738
739 out_vunmap_cbuf:
740         vm_unmap_ram(cc->cbuf, cc->nr_cpages);
741 out_vunmap_rbuf:
742         vm_unmap_ram(cc->rbuf, cc->cluster_size);
743 out_free_cpages:
744         for (i = 0; i < cc->nr_cpages; i++) {
745                 if (cc->cpages[i])
746                         f2fs_compress_free_page(cc->cpages[i]);
747         }
748         page_array_free(cc->inode, cc->cpages, cc->nr_cpages);
749         cc->cpages = NULL;
750 destroy_compress_ctx:
751         if (cops->destroy_compress_ctx)
752                 cops->destroy_compress_ctx(cc);
753 out:
754         trace_f2fs_compress_pages_end(cc->inode, cc->cluster_idx,
755                                                         cc->clen, ret);
756         return ret;
757 }
758
759 static void f2fs_decompress_cluster(struct decompress_io_ctx *dic)
760 {
761         struct f2fs_sb_info *sbi = F2FS_I_SB(dic->inode);
762         struct f2fs_inode_info *fi = F2FS_I(dic->inode);
763         const struct f2fs_compress_ops *cops =
764                         f2fs_cops[fi->i_compress_algorithm];
765         int ret;
766         int i;
767
768         trace_f2fs_decompress_pages_start(dic->inode, dic->cluster_idx,
769                                 dic->cluster_size, fi->i_compress_algorithm);
770
771         if (dic->failed) {
772                 ret = -EIO;
773                 goto out_end_io;
774         }
775
776         dic->tpages = page_array_alloc(dic->inode, dic->cluster_size);
777         if (!dic->tpages) {
778                 ret = -ENOMEM;
779                 goto out_end_io;
780         }
781
782         for (i = 0; i < dic->cluster_size; i++) {
783                 if (dic->rpages[i]) {
784                         dic->tpages[i] = dic->rpages[i];
785                         continue;
786                 }
787
788                 dic->tpages[i] = f2fs_compress_alloc_page();
789                 if (!dic->tpages[i]) {
790                         ret = -ENOMEM;
791                         goto out_end_io;
792                 }
793         }
794
795         if (cops->init_decompress_ctx) {
796                 ret = cops->init_decompress_ctx(dic);
797                 if (ret)
798                         goto out_end_io;
799         }
800
801         dic->rbuf = f2fs_vmap(dic->tpages, dic->cluster_size);
802         if (!dic->rbuf) {
803                 ret = -ENOMEM;
804                 goto out_destroy_decompress_ctx;
805         }
806
807         dic->cbuf = f2fs_vmap(dic->cpages, dic->nr_cpages);
808         if (!dic->cbuf) {
809                 ret = -ENOMEM;
810                 goto out_vunmap_rbuf;
811         }
812
813         dic->clen = le32_to_cpu(dic->cbuf->clen);
814         dic->rlen = PAGE_SIZE << dic->log_cluster_size;
815
816         if (dic->clen > PAGE_SIZE * dic->nr_cpages - COMPRESS_HEADER_SIZE) {
817                 ret = -EFSCORRUPTED;
818                 goto out_vunmap_cbuf;
819         }
820
821         ret = cops->decompress_pages(dic);
822
823         if (!ret && (fi->i_compress_flag & 1 << COMPRESS_CHKSUM)) {
824                 u32 provided = le32_to_cpu(dic->cbuf->chksum);
825                 u32 calculated = f2fs_crc32(sbi, dic->cbuf->cdata, dic->clen);
826
827                 if (provided != calculated) {
828                         if (!is_inode_flag_set(dic->inode, FI_COMPRESS_CORRUPT)) {
829                                 set_inode_flag(dic->inode, FI_COMPRESS_CORRUPT);
830                                 printk_ratelimited(
831                                         "%sF2FS-fs (%s): checksum invalid, nid = %lu, %x vs %x",
832                                         KERN_INFO, sbi->sb->s_id, dic->inode->i_ino,
833                                         provided, calculated);
834                         }
835                         set_sbi_flag(sbi, SBI_NEED_FSCK);
836                 }
837         }
838
839 out_vunmap_cbuf:
840         vm_unmap_ram(dic->cbuf, dic->nr_cpages);
841 out_vunmap_rbuf:
842         vm_unmap_ram(dic->rbuf, dic->cluster_size);
843 out_destroy_decompress_ctx:
844         if (cops->destroy_decompress_ctx)
845                 cops->destroy_decompress_ctx(dic);
846 out_end_io:
847         trace_f2fs_decompress_pages_end(dic->inode, dic->cluster_idx,
848                                                         dic->clen, ret);
849         f2fs_decompress_end_io(dic, ret);
850 }
851
852 /*
853  * This is called when a page of a compressed cluster has been read from disk
854  * (or failed to be read from disk).  It checks whether this page was the last
855  * page being waited on in the cluster, and if so, it decompresses the cluster
856  * (or in the case of a failure, cleans up without actually decompressing).
857  */
858 void f2fs_end_read_compressed_page(struct page *page, bool failed)
859 {
860         struct decompress_io_ctx *dic =
861                         (struct decompress_io_ctx *)page_private(page);
862         struct f2fs_sb_info *sbi = F2FS_I_SB(dic->inode);
863
864         dec_page_count(sbi, F2FS_RD_DATA);
865
866         if (failed)
867                 WRITE_ONCE(dic->failed, true);
868
869         if (atomic_dec_and_test(&dic->remaining_pages))
870                 f2fs_decompress_cluster(dic);
871 }
872
873 static bool is_page_in_cluster(struct compress_ctx *cc, pgoff_t index)
874 {
875         if (cc->cluster_idx == NULL_CLUSTER)
876                 return true;
877         return cc->cluster_idx == cluster_idx(cc, index);
878 }
879
880 bool f2fs_cluster_is_empty(struct compress_ctx *cc)
881 {
882         return cc->nr_rpages == 0;
883 }
884
885 static bool f2fs_cluster_is_full(struct compress_ctx *cc)
886 {
887         return cc->cluster_size == cc->nr_rpages;
888 }
889
890 bool f2fs_cluster_can_merge_page(struct compress_ctx *cc, pgoff_t index)
891 {
892         if (f2fs_cluster_is_empty(cc))
893                 return true;
894         return is_page_in_cluster(cc, index);
895 }
896
897 static bool __cluster_may_compress(struct compress_ctx *cc)
898 {
899         struct f2fs_sb_info *sbi = F2FS_I_SB(cc->inode);
900         loff_t i_size = i_size_read(cc->inode);
901         unsigned nr_pages = DIV_ROUND_UP(i_size, PAGE_SIZE);
902         int i;
903
904         for (i = 0; i < cc->cluster_size; i++) {
905                 struct page *page = cc->rpages[i];
906
907                 f2fs_bug_on(sbi, !page);
908
909                 if (unlikely(f2fs_cp_error(sbi)))
910                         return false;
911                 if (unlikely(is_sbi_flag_set(sbi, SBI_POR_DOING)))
912                         return false;
913
914                 /* beyond EOF */
915                 if (page->index >= nr_pages)
916                         return false;
917         }
918         return true;
919 }
920
921 static int __f2fs_cluster_blocks(struct compress_ctx *cc, bool compr)
922 {
923         struct dnode_of_data dn;
924         int ret;
925
926         set_new_dnode(&dn, cc->inode, NULL, NULL, 0);
927         ret = f2fs_get_dnode_of_data(&dn, start_idx_of_cluster(cc),
928                                                         LOOKUP_NODE);
929         if (ret) {
930                 if (ret == -ENOENT)
931                         ret = 0;
932                 goto fail;
933         }
934
935         if (dn.data_blkaddr == COMPRESS_ADDR) {
936                 int i;
937
938                 ret = 1;
939                 for (i = 1; i < cc->cluster_size; i++) {
940                         block_t blkaddr;
941
942                         blkaddr = data_blkaddr(dn.inode,
943                                         dn.node_page, dn.ofs_in_node + i);
944                         if (compr) {
945                                 if (__is_valid_data_blkaddr(blkaddr))
946                                         ret++;
947                         } else {
948                                 if (blkaddr != NULL_ADDR)
949                                         ret++;
950                         }
951                 }
952         }
953 fail:
954         f2fs_put_dnode(&dn);
955         return ret;
956 }
957
958 /* return # of compressed blocks in compressed cluster */
959 static int f2fs_compressed_blocks(struct compress_ctx *cc)
960 {
961         return __f2fs_cluster_blocks(cc, true);
962 }
963
964 /* return # of valid blocks in compressed cluster */
965 static int f2fs_cluster_blocks(struct compress_ctx *cc)
966 {
967         return __f2fs_cluster_blocks(cc, false);
968 }
969
970 int f2fs_is_compressed_cluster(struct inode *inode, pgoff_t index)
971 {
972         struct compress_ctx cc = {
973                 .inode = inode,
974                 .log_cluster_size = F2FS_I(inode)->i_log_cluster_size,
975                 .cluster_size = F2FS_I(inode)->i_cluster_size,
976                 .cluster_idx = index >> F2FS_I(inode)->i_log_cluster_size,
977         };
978
979         return f2fs_cluster_blocks(&cc);
980 }
981
982 static bool cluster_may_compress(struct compress_ctx *cc)
983 {
984         if (!f2fs_need_compress_data(cc->inode))
985                 return false;
986         if (f2fs_is_atomic_file(cc->inode))
987                 return false;
988         if (f2fs_is_mmap_file(cc->inode))
989                 return false;
990         if (!f2fs_cluster_is_full(cc))
991                 return false;
992         if (unlikely(f2fs_cp_error(F2FS_I_SB(cc->inode))))
993                 return false;
994         return __cluster_may_compress(cc);
995 }
996
997 static void set_cluster_writeback(struct compress_ctx *cc)
998 {
999         int i;
1000
1001         for (i = 0; i < cc->cluster_size; i++) {
1002                 if (cc->rpages[i])
1003                         set_page_writeback(cc->rpages[i]);
1004         }
1005 }
1006
1007 static void set_cluster_dirty(struct compress_ctx *cc)
1008 {
1009         int i;
1010
1011         for (i = 0; i < cc->cluster_size; i++)
1012                 if (cc->rpages[i])
1013                         set_page_dirty(cc->rpages[i]);
1014 }
1015
1016 static int prepare_compress_overwrite(struct compress_ctx *cc,
1017                 struct page **pagep, pgoff_t index, void **fsdata)
1018 {
1019         struct f2fs_sb_info *sbi = F2FS_I_SB(cc->inode);
1020         struct address_space *mapping = cc->inode->i_mapping;
1021         struct page *page;
1022         struct dnode_of_data dn;
1023         sector_t last_block_in_bio;
1024         unsigned fgp_flag = FGP_LOCK | FGP_WRITE | FGP_CREAT;
1025         pgoff_t start_idx = start_idx_of_cluster(cc);
1026         int i, ret;
1027         bool prealloc;
1028
1029 retry:
1030         ret = f2fs_cluster_blocks(cc);
1031         if (ret <= 0)
1032                 return ret;
1033
1034         /* compressed case */
1035         prealloc = (ret < cc->cluster_size);
1036
1037         ret = f2fs_init_compress_ctx(cc);
1038         if (ret)
1039                 return ret;
1040
1041         /* keep page reference to avoid page reclaim */
1042         for (i = 0; i < cc->cluster_size; i++) {
1043                 page = f2fs_pagecache_get_page(mapping, start_idx + i,
1044                                                         fgp_flag, GFP_NOFS);
1045                 if (!page) {
1046                         ret = -ENOMEM;
1047                         goto unlock_pages;
1048                 }
1049
1050                 if (PageUptodate(page))
1051                         unlock_page(page);
1052                 else
1053                         f2fs_compress_ctx_add_page(cc, page);
1054         }
1055
1056         if (!f2fs_cluster_is_empty(cc)) {
1057                 struct bio *bio = NULL;
1058
1059                 ret = f2fs_read_multi_pages(cc, &bio, cc->cluster_size,
1060                                         &last_block_in_bio, false, true);
1061                 f2fs_destroy_compress_ctx(cc);
1062                 if (ret)
1063                         goto release_pages;
1064                 if (bio)
1065                         f2fs_submit_bio(sbi, bio, DATA);
1066
1067                 ret = f2fs_init_compress_ctx(cc);
1068                 if (ret)
1069                         goto release_pages;
1070         }
1071
1072         for (i = 0; i < cc->cluster_size; i++) {
1073                 f2fs_bug_on(sbi, cc->rpages[i]);
1074
1075                 page = find_lock_page(mapping, start_idx + i);
1076                 f2fs_bug_on(sbi, !page);
1077
1078                 f2fs_wait_on_page_writeback(page, DATA, true, true);
1079
1080                 f2fs_compress_ctx_add_page(cc, page);
1081                 f2fs_put_page(page, 0);
1082
1083                 if (!PageUptodate(page)) {
1084                         f2fs_unlock_rpages(cc, i + 1);
1085                         f2fs_put_rpages_mapping(mapping, start_idx,
1086                                         cc->cluster_size);
1087                         f2fs_destroy_compress_ctx(cc);
1088                         goto retry;
1089                 }
1090         }
1091
1092         if (prealloc) {
1093                 f2fs_do_map_lock(sbi, F2FS_GET_BLOCK_PRE_AIO, true);
1094
1095                 set_new_dnode(&dn, cc->inode, NULL, NULL, 0);
1096
1097                 for (i = cc->cluster_size - 1; i > 0; i--) {
1098                         ret = f2fs_get_block(&dn, start_idx + i);
1099                         if (ret) {
1100                                 i = cc->cluster_size;
1101                                 break;
1102                         }
1103
1104                         if (dn.data_blkaddr != NEW_ADDR)
1105                                 break;
1106                 }
1107
1108                 f2fs_do_map_lock(sbi, F2FS_GET_BLOCK_PRE_AIO, false);
1109         }
1110
1111         if (likely(!ret)) {
1112                 *fsdata = cc->rpages;
1113                 *pagep = cc->rpages[offset_in_cluster(cc, index)];
1114                 return cc->cluster_size;
1115         }
1116
1117 unlock_pages:
1118         f2fs_unlock_rpages(cc, i);
1119 release_pages:
1120         f2fs_put_rpages_mapping(mapping, start_idx, i);
1121         f2fs_destroy_compress_ctx(cc);
1122         return ret;
1123 }
1124
1125 int f2fs_prepare_compress_overwrite(struct inode *inode,
1126                 struct page **pagep, pgoff_t index, void **fsdata)
1127 {
1128         struct compress_ctx cc = {
1129                 .inode = inode,
1130                 .log_cluster_size = F2FS_I(inode)->i_log_cluster_size,
1131                 .cluster_size = F2FS_I(inode)->i_cluster_size,
1132                 .cluster_idx = index >> F2FS_I(inode)->i_log_cluster_size,
1133                 .rpages = NULL,
1134                 .nr_rpages = 0,
1135         };
1136
1137         return prepare_compress_overwrite(&cc, pagep, index, fsdata);
1138 }
1139
1140 bool f2fs_compress_write_end(struct inode *inode, void *fsdata,
1141                                         pgoff_t index, unsigned copied)
1142
1143 {
1144         struct compress_ctx cc = {
1145                 .inode = inode,
1146                 .log_cluster_size = F2FS_I(inode)->i_log_cluster_size,
1147                 .cluster_size = F2FS_I(inode)->i_cluster_size,
1148                 .rpages = fsdata,
1149         };
1150         bool first_index = (index == cc.rpages[0]->index);
1151
1152         if (copied)
1153                 set_cluster_dirty(&cc);
1154
1155         f2fs_put_rpages_wbc(&cc, NULL, false, 1);
1156         f2fs_destroy_compress_ctx(&cc);
1157
1158         return first_index;
1159 }
1160
1161 int f2fs_truncate_partial_cluster(struct inode *inode, u64 from, bool lock)
1162 {
1163         void *fsdata = NULL;
1164         struct page *pagep;
1165         int log_cluster_size = F2FS_I(inode)->i_log_cluster_size;
1166         pgoff_t start_idx = from >> (PAGE_SHIFT + log_cluster_size) <<
1167                                                         log_cluster_size;
1168         int err;
1169
1170         err = f2fs_is_compressed_cluster(inode, start_idx);
1171         if (err < 0)
1172                 return err;
1173
1174         /* truncate normal cluster */
1175         if (!err)
1176                 return f2fs_do_truncate_blocks(inode, from, lock);
1177
1178         /* truncate compressed cluster */
1179         err = f2fs_prepare_compress_overwrite(inode, &pagep,
1180                                                 start_idx, &fsdata);
1181
1182         /* should not be a normal cluster */
1183         f2fs_bug_on(F2FS_I_SB(inode), err == 0);
1184
1185         if (err <= 0)
1186                 return err;
1187
1188         if (err > 0) {
1189                 struct page **rpages = fsdata;
1190                 int cluster_size = F2FS_I(inode)->i_cluster_size;
1191                 int i;
1192
1193                 for (i = cluster_size - 1; i >= 0; i--) {
1194                         loff_t start = rpages[i]->index << PAGE_SHIFT;
1195
1196                         if (from <= start) {
1197                                 zero_user_segment(rpages[i], 0, PAGE_SIZE);
1198                         } else {
1199                                 zero_user_segment(rpages[i], from - start,
1200                                                                 PAGE_SIZE);
1201                                 break;
1202                         }
1203                 }
1204
1205                 f2fs_compress_write_end(inode, fsdata, start_idx, true);
1206         }
1207         return 0;
1208 }
1209
1210 static int f2fs_write_compressed_pages(struct compress_ctx *cc,
1211                                         int *submitted,
1212                                         struct writeback_control *wbc,
1213                                         enum iostat_type io_type)
1214 {
1215         struct inode *inode = cc->inode;
1216         struct f2fs_sb_info *sbi = F2FS_I_SB(inode);
1217         struct f2fs_inode_info *fi = F2FS_I(inode);
1218         struct f2fs_io_info fio = {
1219                 .sbi = sbi,
1220                 .ino = cc->inode->i_ino,
1221                 .type = DATA,
1222                 .op = REQ_OP_WRITE,
1223                 .op_flags = wbc_to_write_flags(wbc),
1224                 .old_blkaddr = NEW_ADDR,
1225                 .page = NULL,
1226                 .encrypted_page = NULL,
1227                 .compressed_page = NULL,
1228                 .submitted = false,
1229                 .io_type = io_type,
1230                 .io_wbc = wbc,
1231                 .encrypted = fscrypt_inode_uses_fs_layer_crypto(cc->inode),
1232         };
1233         struct dnode_of_data dn;
1234         struct node_info ni;
1235         struct compress_io_ctx *cic;
1236         pgoff_t start_idx = start_idx_of_cluster(cc);
1237         unsigned int last_index = cc->cluster_size - 1;
1238         loff_t psize;
1239         int i, err;
1240
1241         if (IS_NOQUOTA(inode)) {
1242                 /*
1243                  * We need to wait for node_write to avoid block allocation during
1244                  * checkpoint. This can only happen to quota writes which can cause
1245                  * the below discard race condition.
1246                  */
1247                 down_read(&sbi->node_write);
1248         } else if (!f2fs_trylock_op(sbi)) {
1249                 goto out_free;
1250         }
1251
1252         set_new_dnode(&dn, cc->inode, NULL, NULL, 0);
1253
1254         err = f2fs_get_dnode_of_data(&dn, start_idx, LOOKUP_NODE);
1255         if (err)
1256                 goto out_unlock_op;
1257
1258         for (i = 0; i < cc->cluster_size; i++) {
1259                 if (data_blkaddr(dn.inode, dn.node_page,
1260                                         dn.ofs_in_node + i) == NULL_ADDR)
1261                         goto out_put_dnode;
1262         }
1263
1264         psize = (loff_t)(cc->rpages[last_index]->index + 1) << PAGE_SHIFT;
1265
1266         err = f2fs_get_node_info(fio.sbi, dn.nid, &ni);
1267         if (err)
1268                 goto out_put_dnode;
1269
1270         fio.version = ni.version;
1271
1272         cic = kmem_cache_zalloc(cic_entry_slab, GFP_NOFS);
1273         if (!cic)
1274                 goto out_put_dnode;
1275
1276         cic->magic = F2FS_COMPRESSED_PAGE_MAGIC;
1277         cic->inode = inode;
1278         atomic_set(&cic->pending_pages, cc->nr_cpages);
1279         cic->rpages = page_array_alloc(cc->inode, cc->cluster_size);
1280         if (!cic->rpages)
1281                 goto out_put_cic;
1282
1283         cic->nr_rpages = cc->cluster_size;
1284
1285         for (i = 0; i < cc->nr_cpages; i++) {
1286                 f2fs_set_compressed_page(cc->cpages[i], inode,
1287                                         cc->rpages[i + 1]->index, cic);
1288                 fio.compressed_page = cc->cpages[i];
1289
1290                 fio.old_blkaddr = data_blkaddr(dn.inode, dn.node_page,
1291                                                 dn.ofs_in_node + i + 1);
1292
1293                 /* wait for GCed page writeback via META_MAPPING */
1294                 f2fs_wait_on_block_writeback(inode, fio.old_blkaddr);
1295
1296                 if (fio.encrypted) {
1297                         fio.page = cc->rpages[i + 1];
1298                         err = f2fs_encrypt_one_page(&fio);
1299                         if (err)
1300                                 goto out_destroy_crypt;
1301                         cc->cpages[i] = fio.encrypted_page;
1302                 }
1303         }
1304
1305         set_cluster_writeback(cc);
1306
1307         for (i = 0; i < cc->cluster_size; i++)
1308                 cic->rpages[i] = cc->rpages[i];
1309
1310         for (i = 0; i < cc->cluster_size; i++, dn.ofs_in_node++) {
1311                 block_t blkaddr;
1312
1313                 blkaddr = f2fs_data_blkaddr(&dn);
1314                 fio.page = cc->rpages[i];
1315                 fio.old_blkaddr = blkaddr;
1316
1317                 /* cluster header */
1318                 if (i == 0) {
1319                         if (blkaddr == COMPRESS_ADDR)
1320                                 fio.compr_blocks++;
1321                         if (__is_valid_data_blkaddr(blkaddr))
1322                                 f2fs_invalidate_blocks(sbi, blkaddr);
1323                         f2fs_update_data_blkaddr(&dn, COMPRESS_ADDR);
1324                         goto unlock_continue;
1325                 }
1326
1327                 if (fio.compr_blocks && __is_valid_data_blkaddr(blkaddr))
1328                         fio.compr_blocks++;
1329
1330                 if (i > cc->nr_cpages) {
1331                         if (__is_valid_data_blkaddr(blkaddr)) {
1332                                 f2fs_invalidate_blocks(sbi, blkaddr);
1333                                 f2fs_update_data_blkaddr(&dn, NEW_ADDR);
1334                         }
1335                         goto unlock_continue;
1336                 }
1337
1338                 f2fs_bug_on(fio.sbi, blkaddr == NULL_ADDR);
1339
1340                 if (fio.encrypted)
1341                         fio.encrypted_page = cc->cpages[i - 1];
1342                 else
1343                         fio.compressed_page = cc->cpages[i - 1];
1344
1345                 cc->cpages[i - 1] = NULL;
1346                 f2fs_outplace_write_data(&dn, &fio);
1347                 (*submitted)++;
1348 unlock_continue:
1349                 inode_dec_dirty_pages(cc->inode);
1350                 unlock_page(fio.page);
1351         }
1352
1353         if (fio.compr_blocks)
1354                 f2fs_i_compr_blocks_update(inode, fio.compr_blocks - 1, false);
1355         f2fs_i_compr_blocks_update(inode, cc->nr_cpages, true);
1356
1357         set_inode_flag(cc->inode, FI_APPEND_WRITE);
1358         if (cc->cluster_idx == 0)
1359                 set_inode_flag(inode, FI_FIRST_BLOCK_WRITTEN);
1360
1361         f2fs_put_dnode(&dn);
1362         if (IS_NOQUOTA(inode))
1363                 up_read(&sbi->node_write);
1364         else
1365                 f2fs_unlock_op(sbi);
1366
1367         spin_lock(&fi->i_size_lock);
1368         if (fi->last_disk_size < psize)
1369                 fi->last_disk_size = psize;
1370         spin_unlock(&fi->i_size_lock);
1371
1372         f2fs_put_rpages(cc);
1373         page_array_free(cc->inode, cc->cpages, cc->nr_cpages);
1374         cc->cpages = NULL;
1375         f2fs_destroy_compress_ctx(cc);
1376         return 0;
1377
1378 out_destroy_crypt:
1379         page_array_free(cc->inode, cic->rpages, cc->cluster_size);
1380
1381         for (--i; i >= 0; i--)
1382                 fscrypt_finalize_bounce_page(&cc->cpages[i]);
1383         for (i = 0; i < cc->nr_cpages; i++) {
1384                 if (!cc->cpages[i])
1385                         continue;
1386                 f2fs_put_page(cc->cpages[i], 1);
1387         }
1388 out_put_cic:
1389         kmem_cache_free(cic_entry_slab, cic);
1390 out_put_dnode:
1391         f2fs_put_dnode(&dn);
1392 out_unlock_op:
1393         if (IS_NOQUOTA(inode))
1394                 up_read(&sbi->node_write);
1395         else
1396                 f2fs_unlock_op(sbi);
1397 out_free:
1398         page_array_free(cc->inode, cc->cpages, cc->nr_cpages);
1399         cc->cpages = NULL;
1400         return -EAGAIN;
1401 }
1402
1403 void f2fs_compress_write_end_io(struct bio *bio, struct page *page)
1404 {
1405         struct f2fs_sb_info *sbi = bio->bi_private;
1406         struct compress_io_ctx *cic =
1407                         (struct compress_io_ctx *)page_private(page);
1408         int i;
1409
1410         if (unlikely(bio->bi_status))
1411                 mapping_set_error(cic->inode->i_mapping, -EIO);
1412
1413         f2fs_compress_free_page(page);
1414
1415         dec_page_count(sbi, F2FS_WB_DATA);
1416
1417         if (atomic_dec_return(&cic->pending_pages))
1418                 return;
1419
1420         for (i = 0; i < cic->nr_rpages; i++) {
1421                 WARN_ON(!cic->rpages[i]);
1422                 clear_cold_data(cic->rpages[i]);
1423                 end_page_writeback(cic->rpages[i]);
1424         }
1425
1426         page_array_free(cic->inode, cic->rpages, cic->nr_rpages);
1427         kmem_cache_free(cic_entry_slab, cic);
1428 }
1429
1430 static int f2fs_write_raw_pages(struct compress_ctx *cc,
1431                                         int *submitted,
1432                                         struct writeback_control *wbc,
1433                                         enum iostat_type io_type)
1434 {
1435         struct address_space *mapping = cc->inode->i_mapping;
1436         int _submitted, compr_blocks, ret;
1437         int i = -1, err = 0;
1438
1439         compr_blocks = f2fs_compressed_blocks(cc);
1440         if (compr_blocks < 0) {
1441                 err = compr_blocks;
1442                 goto out_err;
1443         }
1444
1445         for (i = 0; i < cc->cluster_size; i++) {
1446                 if (!cc->rpages[i])
1447                         continue;
1448 retry_write:
1449                 if (cc->rpages[i]->mapping != mapping) {
1450                         unlock_page(cc->rpages[i]);
1451                         continue;
1452                 }
1453
1454                 BUG_ON(!PageLocked(cc->rpages[i]));
1455
1456                 ret = f2fs_write_single_data_page(cc->rpages[i], &_submitted,
1457                                                 NULL, NULL, wbc, io_type,
1458                                                 compr_blocks, false);
1459                 if (ret) {
1460                         if (ret == AOP_WRITEPAGE_ACTIVATE) {
1461                                 unlock_page(cc->rpages[i]);
1462                                 ret = 0;
1463                         } else if (ret == -EAGAIN) {
1464                                 /*
1465                                  * for quota file, just redirty left pages to
1466                                  * avoid deadlock caused by cluster update race
1467                                  * from foreground operation.
1468                                  */
1469                                 if (IS_NOQUOTA(cc->inode)) {
1470                                         err = 0;
1471                                         goto out_err;
1472                                 }
1473                                 ret = 0;
1474                                 cond_resched();
1475                                 congestion_wait(BLK_RW_ASYNC,
1476                                                 DEFAULT_IO_TIMEOUT);
1477                                 lock_page(cc->rpages[i]);
1478
1479                                 if (!PageDirty(cc->rpages[i])) {
1480                                         unlock_page(cc->rpages[i]);
1481                                         continue;
1482                                 }
1483
1484                                 clear_page_dirty_for_io(cc->rpages[i]);
1485                                 goto retry_write;
1486                         }
1487                         err = ret;
1488                         goto out_err;
1489                 }
1490
1491                 *submitted += _submitted;
1492         }
1493
1494         f2fs_balance_fs(F2FS_M_SB(mapping), true);
1495
1496         return 0;
1497 out_err:
1498         for (++i; i < cc->cluster_size; i++) {
1499                 if (!cc->rpages[i])
1500                         continue;
1501                 redirty_page_for_writepage(wbc, cc->rpages[i]);
1502                 unlock_page(cc->rpages[i]);
1503         }
1504         return err;
1505 }
1506
1507 int f2fs_write_multi_pages(struct compress_ctx *cc,
1508                                         int *submitted,
1509                                         struct writeback_control *wbc,
1510                                         enum iostat_type io_type)
1511 {
1512         int err;
1513
1514         *submitted = 0;
1515         if (cluster_may_compress(cc)) {
1516                 err = f2fs_compress_pages(cc);
1517                 if (err == -EAGAIN) {
1518                         goto write;
1519                 } else if (err) {
1520                         f2fs_put_rpages_wbc(cc, wbc, true, 1);
1521                         goto destroy_out;
1522                 }
1523
1524                 err = f2fs_write_compressed_pages(cc, submitted,
1525                                                         wbc, io_type);
1526                 if (!err)
1527                         return 0;
1528                 f2fs_bug_on(F2FS_I_SB(cc->inode), err != -EAGAIN);
1529         }
1530 write:
1531         f2fs_bug_on(F2FS_I_SB(cc->inode), *submitted);
1532
1533         err = f2fs_write_raw_pages(cc, submitted, wbc, io_type);
1534         f2fs_put_rpages_wbc(cc, wbc, false, 0);
1535 destroy_out:
1536         f2fs_destroy_compress_ctx(cc);
1537         return err;
1538 }
1539
1540 static void f2fs_free_dic(struct decompress_io_ctx *dic);
1541
1542 struct decompress_io_ctx *f2fs_alloc_dic(struct compress_ctx *cc)
1543 {
1544         struct decompress_io_ctx *dic;
1545         pgoff_t start_idx = start_idx_of_cluster(cc);
1546         int i;
1547
1548         dic = kmem_cache_zalloc(dic_entry_slab, GFP_NOFS);
1549         if (!dic)
1550                 return ERR_PTR(-ENOMEM);
1551
1552         dic->rpages = page_array_alloc(cc->inode, cc->cluster_size);
1553         if (!dic->rpages) {
1554                 kmem_cache_free(dic_entry_slab, dic);
1555                 return ERR_PTR(-ENOMEM);
1556         }
1557
1558         dic->magic = F2FS_COMPRESSED_PAGE_MAGIC;
1559         dic->inode = cc->inode;
1560         atomic_set(&dic->remaining_pages, cc->nr_cpages);
1561         dic->cluster_idx = cc->cluster_idx;
1562         dic->cluster_size = cc->cluster_size;
1563         dic->log_cluster_size = cc->log_cluster_size;
1564         dic->nr_cpages = cc->nr_cpages;
1565         refcount_set(&dic->refcnt, 1);
1566         dic->failed = false;
1567         dic->need_verity = f2fs_need_verity(cc->inode, start_idx);
1568
1569         for (i = 0; i < dic->cluster_size; i++)
1570                 dic->rpages[i] = cc->rpages[i];
1571         dic->nr_rpages = cc->cluster_size;
1572
1573         dic->cpages = page_array_alloc(dic->inode, dic->nr_cpages);
1574         if (!dic->cpages)
1575                 goto out_free;
1576
1577         for (i = 0; i < dic->nr_cpages; i++) {
1578                 struct page *page;
1579
1580                 page = f2fs_compress_alloc_page();
1581                 if (!page)
1582                         goto out_free;
1583
1584                 f2fs_set_compressed_page(page, cc->inode,
1585                                         start_idx + i + 1, dic);
1586                 dic->cpages[i] = page;
1587         }
1588
1589         return dic;
1590
1591 out_free:
1592         f2fs_free_dic(dic);
1593         return ERR_PTR(-ENOMEM);
1594 }
1595
1596 static void f2fs_free_dic(struct decompress_io_ctx *dic)
1597 {
1598         int i;
1599
1600         if (dic->tpages) {
1601                 for (i = 0; i < dic->cluster_size; i++) {
1602                         if (dic->rpages[i])
1603                                 continue;
1604                         if (!dic->tpages[i])
1605                                 continue;
1606                         f2fs_compress_free_page(dic->tpages[i]);
1607                 }
1608                 page_array_free(dic->inode, dic->tpages, dic->cluster_size);
1609         }
1610
1611         if (dic->cpages) {
1612                 for (i = 0; i < dic->nr_cpages; i++) {
1613                         if (!dic->cpages[i])
1614                                 continue;
1615                         f2fs_compress_free_page(dic->cpages[i]);
1616                 }
1617                 page_array_free(dic->inode, dic->cpages, dic->nr_cpages);
1618         }
1619
1620         page_array_free(dic->inode, dic->rpages, dic->nr_rpages);
1621         kmem_cache_free(dic_entry_slab, dic);
1622 }
1623
1624 static void f2fs_put_dic(struct decompress_io_ctx *dic)
1625 {
1626         if (refcount_dec_and_test(&dic->refcnt))
1627                 f2fs_free_dic(dic);
1628 }
1629
1630 /*
1631  * Update and unlock the cluster's pagecache pages, and release the reference to
1632  * the decompress_io_ctx that was being held for I/O completion.
1633  */
1634 static void __f2fs_decompress_end_io(struct decompress_io_ctx *dic, bool failed)
1635 {
1636         int i;
1637
1638         for (i = 0; i < dic->cluster_size; i++) {
1639                 struct page *rpage = dic->rpages[i];
1640
1641                 if (!rpage)
1642                         continue;
1643
1644                 /* PG_error was set if verity failed. */
1645                 if (failed || PageError(rpage)) {
1646                         ClearPageUptodate(rpage);
1647                         /* will re-read again later */
1648                         ClearPageError(rpage);
1649                 } else {
1650                         SetPageUptodate(rpage);
1651                 }
1652                 unlock_page(rpage);
1653         }
1654
1655         f2fs_put_dic(dic);
1656 }
1657
1658 static void f2fs_verify_cluster(struct work_struct *work)
1659 {
1660         struct decompress_io_ctx *dic =
1661                 container_of(work, struct decompress_io_ctx, verity_work);
1662         int i;
1663
1664         /* Verify the cluster's decompressed pages with fs-verity. */
1665         for (i = 0; i < dic->cluster_size; i++) {
1666                 struct page *rpage = dic->rpages[i];
1667
1668                 if (rpage && !fsverity_verify_page(rpage))
1669                         SetPageError(rpage);
1670         }
1671
1672         __f2fs_decompress_end_io(dic, false);
1673 }
1674
1675 /*
1676  * This is called when a compressed cluster has been decompressed
1677  * (or failed to be read and/or decompressed).
1678  */
1679 void f2fs_decompress_end_io(struct decompress_io_ctx *dic, bool failed)
1680 {
1681         if (!failed && dic->need_verity) {
1682                 /*
1683                  * Note that to avoid deadlocks, the verity work can't be done
1684                  * on the decompression workqueue.  This is because verifying
1685                  * the data pages can involve reading metadata pages from the
1686                  * file, and these metadata pages may be compressed.
1687                  */
1688                 INIT_WORK(&dic->verity_work, f2fs_verify_cluster);
1689                 fsverity_enqueue_verify_work(&dic->verity_work);
1690         } else {
1691                 __f2fs_decompress_end_io(dic, failed);
1692         }
1693 }
1694
1695 /*
1696  * Put a reference to a compressed page's decompress_io_ctx.
1697  *
1698  * This is called when the page is no longer needed and can be freed.
1699  */
1700 void f2fs_put_page_dic(struct page *page)
1701 {
1702         struct decompress_io_ctx *dic =
1703                         (struct decompress_io_ctx *)page_private(page);
1704
1705         f2fs_put_dic(dic);
1706 }
1707
1708 int f2fs_init_page_array_cache(struct f2fs_sb_info *sbi)
1709 {
1710         dev_t dev = sbi->sb->s_bdev->bd_dev;
1711         char slab_name[32];
1712
1713         sprintf(slab_name, "f2fs_page_array_entry-%u:%u", MAJOR(dev), MINOR(dev));
1714
1715         sbi->page_array_slab_size = sizeof(struct page *) <<
1716                                         F2FS_OPTION(sbi).compress_log_size;
1717
1718         sbi->page_array_slab = f2fs_kmem_cache_create(slab_name,
1719                                         sbi->page_array_slab_size);
1720         if (!sbi->page_array_slab)
1721                 return -ENOMEM;
1722         return 0;
1723 }
1724
1725 void f2fs_destroy_page_array_cache(struct f2fs_sb_info *sbi)
1726 {
1727         kmem_cache_destroy(sbi->page_array_slab);
1728 }
1729
1730 static int __init f2fs_init_cic_cache(void)
1731 {
1732         cic_entry_slab = f2fs_kmem_cache_create("f2fs_cic_entry",
1733                                         sizeof(struct compress_io_ctx));
1734         if (!cic_entry_slab)
1735                 return -ENOMEM;
1736         return 0;
1737 }
1738
1739 static void f2fs_destroy_cic_cache(void)
1740 {
1741         kmem_cache_destroy(cic_entry_slab);
1742 }
1743
1744 static int __init f2fs_init_dic_cache(void)
1745 {
1746         dic_entry_slab = f2fs_kmem_cache_create("f2fs_dic_entry",
1747                                         sizeof(struct decompress_io_ctx));
1748         if (!dic_entry_slab)
1749                 return -ENOMEM;
1750         return 0;
1751 }
1752
1753 static void f2fs_destroy_dic_cache(void)
1754 {
1755         kmem_cache_destroy(dic_entry_slab);
1756 }
1757
1758 int __init f2fs_init_compress_cache(void)
1759 {
1760         int err;
1761
1762         err = f2fs_init_cic_cache();
1763         if (err)
1764                 goto out;
1765         err = f2fs_init_dic_cache();
1766         if (err)
1767                 goto free_cic;
1768         return 0;
1769 free_cic:
1770         f2fs_destroy_cic_cache();
1771 out:
1772         return -ENOMEM;
1773 }
1774
1775 void f2fs_destroy_compress_cache(void)
1776 {
1777         f2fs_destroy_dic_cache();
1778         f2fs_destroy_cic_cache();
1779 }