Merge tag 'slab-for-6.5' of git://git.kernel.org/pub/scm/linux/kernel/git/vbabka...
[linux-2.6-microblaze.git] / fs / nilfs2 / sufile.c
1 // SPDX-License-Identifier: GPL-2.0+
2 /*
3  * NILFS segment usage file.
4  *
5  * Copyright (C) 2006-2008 Nippon Telegraph and Telephone Corporation.
6  *
7  * Written by Koji Sato.
8  * Revised by Ryusuke Konishi.
9  */
10
11 #include <linux/kernel.h>
12 #include <linux/fs.h>
13 #include <linux/string.h>
14 #include <linux/buffer_head.h>
15 #include <linux/errno.h>
16 #include "mdt.h"
17 #include "sufile.h"
18
19 #include <trace/events/nilfs2.h>
20
21 /**
22  * struct nilfs_sufile_info - on-memory private data of sufile
23  * @mi: on-memory private data of metadata file
24  * @ncleansegs: number of clean segments
25  * @allocmin: lower limit of allocatable segment range
26  * @allocmax: upper limit of allocatable segment range
27  */
28 struct nilfs_sufile_info {
29         struct nilfs_mdt_info mi;
30         unsigned long ncleansegs;/* number of clean segments */
31         __u64 allocmin;         /* lower limit of allocatable segment range */
32         __u64 allocmax;         /* upper limit of allocatable segment range */
33 };
34
35 static inline struct nilfs_sufile_info *NILFS_SUI(struct inode *sufile)
36 {
37         return (struct nilfs_sufile_info *)NILFS_MDT(sufile);
38 }
39
40 static inline unsigned long
41 nilfs_sufile_segment_usages_per_block(const struct inode *sufile)
42 {
43         return NILFS_MDT(sufile)->mi_entries_per_block;
44 }
45
46 static unsigned long
47 nilfs_sufile_get_blkoff(const struct inode *sufile, __u64 segnum)
48 {
49         __u64 t = segnum + NILFS_MDT(sufile)->mi_first_entry_offset;
50
51         do_div(t, nilfs_sufile_segment_usages_per_block(sufile));
52         return (unsigned long)t;
53 }
54
55 static unsigned long
56 nilfs_sufile_get_offset(const struct inode *sufile, __u64 segnum)
57 {
58         __u64 t = segnum + NILFS_MDT(sufile)->mi_first_entry_offset;
59
60         return do_div(t, nilfs_sufile_segment_usages_per_block(sufile));
61 }
62
63 static unsigned long
64 nilfs_sufile_segment_usages_in_block(const struct inode *sufile, __u64 curr,
65                                      __u64 max)
66 {
67         return min_t(unsigned long,
68                      nilfs_sufile_segment_usages_per_block(sufile) -
69                      nilfs_sufile_get_offset(sufile, curr),
70                      max - curr + 1);
71 }
72
73 static struct nilfs_segment_usage *
74 nilfs_sufile_block_get_segment_usage(const struct inode *sufile, __u64 segnum,
75                                      struct buffer_head *bh, void *kaddr)
76 {
77         return kaddr + bh_offset(bh) +
78                 nilfs_sufile_get_offset(sufile, segnum) *
79                 NILFS_MDT(sufile)->mi_entry_size;
80 }
81
82 static inline int nilfs_sufile_get_header_block(struct inode *sufile,
83                                                 struct buffer_head **bhp)
84 {
85         return nilfs_mdt_get_block(sufile, 0, 0, NULL, bhp);
86 }
87
88 static inline int
89 nilfs_sufile_get_segment_usage_block(struct inode *sufile, __u64 segnum,
90                                      int create, struct buffer_head **bhp)
91 {
92         return nilfs_mdt_get_block(sufile,
93                                    nilfs_sufile_get_blkoff(sufile, segnum),
94                                    create, NULL, bhp);
95 }
96
97 static int nilfs_sufile_delete_segment_usage_block(struct inode *sufile,
98                                                    __u64 segnum)
99 {
100         return nilfs_mdt_delete_block(sufile,
101                                       nilfs_sufile_get_blkoff(sufile, segnum));
102 }
103
104 static void nilfs_sufile_mod_counter(struct buffer_head *header_bh,
105                                      u64 ncleanadd, u64 ndirtyadd)
106 {
107         struct nilfs_sufile_header *header;
108         void *kaddr;
109
110         kaddr = kmap_atomic(header_bh->b_page);
111         header = kaddr + bh_offset(header_bh);
112         le64_add_cpu(&header->sh_ncleansegs, ncleanadd);
113         le64_add_cpu(&header->sh_ndirtysegs, ndirtyadd);
114         kunmap_atomic(kaddr);
115
116         mark_buffer_dirty(header_bh);
117 }
118
119 /**
120  * nilfs_sufile_get_ncleansegs - return the number of clean segments
121  * @sufile: inode of segment usage file
122  */
123 unsigned long nilfs_sufile_get_ncleansegs(struct inode *sufile)
124 {
125         return NILFS_SUI(sufile)->ncleansegs;
126 }
127
128 /**
129  * nilfs_sufile_updatev - modify multiple segment usages at a time
130  * @sufile: inode of segment usage file
131  * @segnumv: array of segment numbers
132  * @nsegs: size of @segnumv array
133  * @create: creation flag
134  * @ndone: place to store number of modified segments on @segnumv
135  * @dofunc: primitive operation for the update
136  *
137  * Description: nilfs_sufile_updatev() repeatedly calls @dofunc
138  * against the given array of segments.  The @dofunc is called with
139  * buffers of a header block and the sufile block in which the target
140  * segment usage entry is contained.  If @ndone is given, the number
141  * of successfully modified segments from the head is stored in the
142  * place @ndone points to.
143  *
144  * Return Value: On success, zero is returned.  On error, one of the
145  * following negative error codes is returned.
146  *
147  * %-EIO - I/O error.
148  *
149  * %-ENOMEM - Insufficient amount of memory available.
150  *
151  * %-ENOENT - Given segment usage is in hole block (may be returned if
152  *            @create is zero)
153  *
154  * %-EINVAL - Invalid segment usage number
155  */
156 int nilfs_sufile_updatev(struct inode *sufile, __u64 *segnumv, size_t nsegs,
157                          int create, size_t *ndone,
158                          void (*dofunc)(struct inode *, __u64,
159                                         struct buffer_head *,
160                                         struct buffer_head *))
161 {
162         struct buffer_head *header_bh, *bh;
163         unsigned long blkoff, prev_blkoff;
164         __u64 *seg;
165         size_t nerr = 0, n = 0;
166         int ret = 0;
167
168         if (unlikely(nsegs == 0))
169                 goto out;
170
171         down_write(&NILFS_MDT(sufile)->mi_sem);
172         for (seg = segnumv; seg < segnumv + nsegs; seg++) {
173                 if (unlikely(*seg >= nilfs_sufile_get_nsegments(sufile))) {
174                         nilfs_warn(sufile->i_sb,
175                                    "%s: invalid segment number: %llu",
176                                    __func__, (unsigned long long)*seg);
177                         nerr++;
178                 }
179         }
180         if (nerr > 0) {
181                 ret = -EINVAL;
182                 goto out_sem;
183         }
184
185         ret = nilfs_sufile_get_header_block(sufile, &header_bh);
186         if (ret < 0)
187                 goto out_sem;
188
189         seg = segnumv;
190         blkoff = nilfs_sufile_get_blkoff(sufile, *seg);
191         ret = nilfs_mdt_get_block(sufile, blkoff, create, NULL, &bh);
192         if (ret < 0)
193                 goto out_header;
194
195         for (;;) {
196                 dofunc(sufile, *seg, header_bh, bh);
197
198                 if (++seg >= segnumv + nsegs)
199                         break;
200                 prev_blkoff = blkoff;
201                 blkoff = nilfs_sufile_get_blkoff(sufile, *seg);
202                 if (blkoff == prev_blkoff)
203                         continue;
204
205                 /* get different block */
206                 brelse(bh);
207                 ret = nilfs_mdt_get_block(sufile, blkoff, create, NULL, &bh);
208                 if (unlikely(ret < 0))
209                         goto out_header;
210         }
211         brelse(bh);
212
213  out_header:
214         n = seg - segnumv;
215         brelse(header_bh);
216  out_sem:
217         up_write(&NILFS_MDT(sufile)->mi_sem);
218  out:
219         if (ndone)
220                 *ndone = n;
221         return ret;
222 }
223
224 int nilfs_sufile_update(struct inode *sufile, __u64 segnum, int create,
225                         void (*dofunc)(struct inode *, __u64,
226                                        struct buffer_head *,
227                                        struct buffer_head *))
228 {
229         struct buffer_head *header_bh, *bh;
230         int ret;
231
232         if (unlikely(segnum >= nilfs_sufile_get_nsegments(sufile))) {
233                 nilfs_warn(sufile->i_sb, "%s: invalid segment number: %llu",
234                            __func__, (unsigned long long)segnum);
235                 return -EINVAL;
236         }
237         down_write(&NILFS_MDT(sufile)->mi_sem);
238
239         ret = nilfs_sufile_get_header_block(sufile, &header_bh);
240         if (ret < 0)
241                 goto out_sem;
242
243         ret = nilfs_sufile_get_segment_usage_block(sufile, segnum, create, &bh);
244         if (!ret) {
245                 dofunc(sufile, segnum, header_bh, bh);
246                 brelse(bh);
247         }
248         brelse(header_bh);
249
250  out_sem:
251         up_write(&NILFS_MDT(sufile)->mi_sem);
252         return ret;
253 }
254
255 /**
256  * nilfs_sufile_set_alloc_range - limit range of segment to be allocated
257  * @sufile: inode of segment usage file
258  * @start: minimum segment number of allocatable region (inclusive)
259  * @end: maximum segment number of allocatable region (inclusive)
260  *
261  * Return Value: On success, 0 is returned.  On error, one of the
262  * following negative error codes is returned.
263  *
264  * %-ERANGE - invalid segment region
265  */
266 int nilfs_sufile_set_alloc_range(struct inode *sufile, __u64 start, __u64 end)
267 {
268         struct nilfs_sufile_info *sui = NILFS_SUI(sufile);
269         __u64 nsegs;
270         int ret = -ERANGE;
271
272         down_write(&NILFS_MDT(sufile)->mi_sem);
273         nsegs = nilfs_sufile_get_nsegments(sufile);
274
275         if (start <= end && end < nsegs) {
276                 sui->allocmin = start;
277                 sui->allocmax = end;
278                 ret = 0;
279         }
280         up_write(&NILFS_MDT(sufile)->mi_sem);
281         return ret;
282 }
283
284 /**
285  * nilfs_sufile_alloc - allocate a segment
286  * @sufile: inode of segment usage file
287  * @segnump: pointer to segment number
288  *
289  * Description: nilfs_sufile_alloc() allocates a clean segment.
290  *
291  * Return Value: On success, 0 is returned and the segment number of the
292  * allocated segment is stored in the place pointed by @segnump. On error, one
293  * of the following negative error codes is returned.
294  *
295  * %-EIO - I/O error.
296  *
297  * %-ENOMEM - Insufficient amount of memory available.
298  *
299  * %-ENOSPC - No clean segment left.
300  */
301 int nilfs_sufile_alloc(struct inode *sufile, __u64 *segnump)
302 {
303         struct buffer_head *header_bh, *su_bh;
304         struct nilfs_sufile_header *header;
305         struct nilfs_segment_usage *su;
306         struct nilfs_sufile_info *sui = NILFS_SUI(sufile);
307         size_t susz = NILFS_MDT(sufile)->mi_entry_size;
308         __u64 segnum, maxsegnum, last_alloc;
309         void *kaddr;
310         unsigned long nsegments, nsus, cnt;
311         int ret, j;
312
313         down_write(&NILFS_MDT(sufile)->mi_sem);
314
315         ret = nilfs_sufile_get_header_block(sufile, &header_bh);
316         if (ret < 0)
317                 goto out_sem;
318         kaddr = kmap_atomic(header_bh->b_page);
319         header = kaddr + bh_offset(header_bh);
320         last_alloc = le64_to_cpu(header->sh_last_alloc);
321         kunmap_atomic(kaddr);
322
323         nsegments = nilfs_sufile_get_nsegments(sufile);
324         maxsegnum = sui->allocmax;
325         segnum = last_alloc + 1;
326         if (segnum < sui->allocmin || segnum > sui->allocmax)
327                 segnum = sui->allocmin;
328
329         for (cnt = 0; cnt < nsegments; cnt += nsus) {
330                 if (segnum > maxsegnum) {
331                         if (cnt < sui->allocmax - sui->allocmin + 1) {
332                                 /*
333                                  * wrap around in the limited region.
334                                  * if allocation started from
335                                  * sui->allocmin, this never happens.
336                                  */
337                                 segnum = sui->allocmin;
338                                 maxsegnum = last_alloc;
339                         } else if (segnum > sui->allocmin &&
340                                    sui->allocmax + 1 < nsegments) {
341                                 segnum = sui->allocmax + 1;
342                                 maxsegnum = nsegments - 1;
343                         } else if (sui->allocmin > 0)  {
344                                 segnum = 0;
345                                 maxsegnum = sui->allocmin - 1;
346                         } else {
347                                 break; /* never happens */
348                         }
349                 }
350                 trace_nilfs2_segment_usage_check(sufile, segnum, cnt);
351                 ret = nilfs_sufile_get_segment_usage_block(sufile, segnum, 1,
352                                                            &su_bh);
353                 if (ret < 0)
354                         goto out_header;
355                 kaddr = kmap_atomic(su_bh->b_page);
356                 su = nilfs_sufile_block_get_segment_usage(
357                         sufile, segnum, su_bh, kaddr);
358
359                 nsus = nilfs_sufile_segment_usages_in_block(
360                         sufile, segnum, maxsegnum);
361                 for (j = 0; j < nsus; j++, su = (void *)su + susz, segnum++) {
362                         if (!nilfs_segment_usage_clean(su))
363                                 continue;
364                         /* found a clean segment */
365                         nilfs_segment_usage_set_dirty(su);
366                         kunmap_atomic(kaddr);
367
368                         kaddr = kmap_atomic(header_bh->b_page);
369                         header = kaddr + bh_offset(header_bh);
370                         le64_add_cpu(&header->sh_ncleansegs, -1);
371                         le64_add_cpu(&header->sh_ndirtysegs, 1);
372                         header->sh_last_alloc = cpu_to_le64(segnum);
373                         kunmap_atomic(kaddr);
374
375                         sui->ncleansegs--;
376                         mark_buffer_dirty(header_bh);
377                         mark_buffer_dirty(su_bh);
378                         nilfs_mdt_mark_dirty(sufile);
379                         brelse(su_bh);
380                         *segnump = segnum;
381
382                         trace_nilfs2_segment_usage_allocated(sufile, segnum);
383
384                         goto out_header;
385                 }
386
387                 kunmap_atomic(kaddr);
388                 brelse(su_bh);
389         }
390
391         /* no segments left */
392         ret = -ENOSPC;
393
394  out_header:
395         brelse(header_bh);
396
397  out_sem:
398         up_write(&NILFS_MDT(sufile)->mi_sem);
399         return ret;
400 }
401
402 void nilfs_sufile_do_cancel_free(struct inode *sufile, __u64 segnum,
403                                  struct buffer_head *header_bh,
404                                  struct buffer_head *su_bh)
405 {
406         struct nilfs_segment_usage *su;
407         void *kaddr;
408
409         kaddr = kmap_atomic(su_bh->b_page);
410         su = nilfs_sufile_block_get_segment_usage(sufile, segnum, su_bh, kaddr);
411         if (unlikely(!nilfs_segment_usage_clean(su))) {
412                 nilfs_warn(sufile->i_sb, "%s: segment %llu must be clean",
413                            __func__, (unsigned long long)segnum);
414                 kunmap_atomic(kaddr);
415                 return;
416         }
417         nilfs_segment_usage_set_dirty(su);
418         kunmap_atomic(kaddr);
419
420         nilfs_sufile_mod_counter(header_bh, -1, 1);
421         NILFS_SUI(sufile)->ncleansegs--;
422
423         mark_buffer_dirty(su_bh);
424         nilfs_mdt_mark_dirty(sufile);
425 }
426
427 void nilfs_sufile_do_scrap(struct inode *sufile, __u64 segnum,
428                            struct buffer_head *header_bh,
429                            struct buffer_head *su_bh)
430 {
431         struct nilfs_segment_usage *su;
432         void *kaddr;
433         int clean, dirty;
434
435         kaddr = kmap_atomic(su_bh->b_page);
436         su = nilfs_sufile_block_get_segment_usage(sufile, segnum, su_bh, kaddr);
437         if (su->su_flags == cpu_to_le32(BIT(NILFS_SEGMENT_USAGE_DIRTY)) &&
438             su->su_nblocks == cpu_to_le32(0)) {
439                 kunmap_atomic(kaddr);
440                 return;
441         }
442         clean = nilfs_segment_usage_clean(su);
443         dirty = nilfs_segment_usage_dirty(su);
444
445         /* make the segment garbage */
446         su->su_lastmod = cpu_to_le64(0);
447         su->su_nblocks = cpu_to_le32(0);
448         su->su_flags = cpu_to_le32(BIT(NILFS_SEGMENT_USAGE_DIRTY));
449         kunmap_atomic(kaddr);
450
451         nilfs_sufile_mod_counter(header_bh, clean ? (u64)-1 : 0, dirty ? 0 : 1);
452         NILFS_SUI(sufile)->ncleansegs -= clean;
453
454         mark_buffer_dirty(su_bh);
455         nilfs_mdt_mark_dirty(sufile);
456 }
457
458 void nilfs_sufile_do_free(struct inode *sufile, __u64 segnum,
459                           struct buffer_head *header_bh,
460                           struct buffer_head *su_bh)
461 {
462         struct nilfs_segment_usage *su;
463         void *kaddr;
464         int sudirty;
465
466         kaddr = kmap_atomic(su_bh->b_page);
467         su = nilfs_sufile_block_get_segment_usage(sufile, segnum, su_bh, kaddr);
468         if (nilfs_segment_usage_clean(su)) {
469                 nilfs_warn(sufile->i_sb, "%s: segment %llu is already clean",
470                            __func__, (unsigned long long)segnum);
471                 kunmap_atomic(kaddr);
472                 return;
473         }
474         WARN_ON(nilfs_segment_usage_error(su));
475         WARN_ON(!nilfs_segment_usage_dirty(su));
476
477         sudirty = nilfs_segment_usage_dirty(su);
478         nilfs_segment_usage_set_clean(su);
479         kunmap_atomic(kaddr);
480         mark_buffer_dirty(su_bh);
481
482         nilfs_sufile_mod_counter(header_bh, 1, sudirty ? (u64)-1 : 0);
483         NILFS_SUI(sufile)->ncleansegs++;
484
485         nilfs_mdt_mark_dirty(sufile);
486
487         trace_nilfs2_segment_usage_freed(sufile, segnum);
488 }
489
490 /**
491  * nilfs_sufile_mark_dirty - mark the buffer having a segment usage dirty
492  * @sufile: inode of segment usage file
493  * @segnum: segment number
494  */
495 int nilfs_sufile_mark_dirty(struct inode *sufile, __u64 segnum)
496 {
497         struct buffer_head *bh;
498         void *kaddr;
499         struct nilfs_segment_usage *su;
500         int ret;
501
502         down_write(&NILFS_MDT(sufile)->mi_sem);
503         ret = nilfs_sufile_get_segment_usage_block(sufile, segnum, 0, &bh);
504         if (!ret) {
505                 mark_buffer_dirty(bh);
506                 nilfs_mdt_mark_dirty(sufile);
507                 kaddr = kmap_atomic(bh->b_page);
508                 su = nilfs_sufile_block_get_segment_usage(sufile, segnum, bh, kaddr);
509                 nilfs_segment_usage_set_dirty(su);
510                 kunmap_atomic(kaddr);
511                 brelse(bh);
512         }
513         up_write(&NILFS_MDT(sufile)->mi_sem);
514         return ret;
515 }
516
517 /**
518  * nilfs_sufile_set_segment_usage - set usage of a segment
519  * @sufile: inode of segment usage file
520  * @segnum: segment number
521  * @nblocks: number of live blocks in the segment
522  * @modtime: modification time (option)
523  */
524 int nilfs_sufile_set_segment_usage(struct inode *sufile, __u64 segnum,
525                                    unsigned long nblocks, time64_t modtime)
526 {
527         struct buffer_head *bh;
528         struct nilfs_segment_usage *su;
529         void *kaddr;
530         int ret;
531
532         down_write(&NILFS_MDT(sufile)->mi_sem);
533         ret = nilfs_sufile_get_segment_usage_block(sufile, segnum, 0, &bh);
534         if (ret < 0)
535                 goto out_sem;
536
537         kaddr = kmap_atomic(bh->b_page);
538         su = nilfs_sufile_block_get_segment_usage(sufile, segnum, bh, kaddr);
539         WARN_ON(nilfs_segment_usage_error(su));
540         if (modtime)
541                 su->su_lastmod = cpu_to_le64(modtime);
542         su->su_nblocks = cpu_to_le32(nblocks);
543         kunmap_atomic(kaddr);
544
545         mark_buffer_dirty(bh);
546         nilfs_mdt_mark_dirty(sufile);
547         brelse(bh);
548
549  out_sem:
550         up_write(&NILFS_MDT(sufile)->mi_sem);
551         return ret;
552 }
553
554 /**
555  * nilfs_sufile_get_stat - get segment usage statistics
556  * @sufile: inode of segment usage file
557  * @sustat: pointer to a structure of segment usage statistics
558  *
559  * Description: nilfs_sufile_get_stat() returns information about segment
560  * usage.
561  *
562  * Return Value: On success, 0 is returned, and segment usage information is
563  * stored in the place pointed by @sustat. On error, one of the following
564  * negative error codes is returned.
565  *
566  * %-EIO - I/O error.
567  *
568  * %-ENOMEM - Insufficient amount of memory available.
569  */
570 int nilfs_sufile_get_stat(struct inode *sufile, struct nilfs_sustat *sustat)
571 {
572         struct buffer_head *header_bh;
573         struct nilfs_sufile_header *header;
574         struct the_nilfs *nilfs = sufile->i_sb->s_fs_info;
575         void *kaddr;
576         int ret;
577
578         down_read(&NILFS_MDT(sufile)->mi_sem);
579
580         ret = nilfs_sufile_get_header_block(sufile, &header_bh);
581         if (ret < 0)
582                 goto out_sem;
583
584         kaddr = kmap_atomic(header_bh->b_page);
585         header = kaddr + bh_offset(header_bh);
586         sustat->ss_nsegs = nilfs_sufile_get_nsegments(sufile);
587         sustat->ss_ncleansegs = le64_to_cpu(header->sh_ncleansegs);
588         sustat->ss_ndirtysegs = le64_to_cpu(header->sh_ndirtysegs);
589         sustat->ss_ctime = nilfs->ns_ctime;
590         sustat->ss_nongc_ctime = nilfs->ns_nongc_ctime;
591         spin_lock(&nilfs->ns_last_segment_lock);
592         sustat->ss_prot_seq = nilfs->ns_prot_seq;
593         spin_unlock(&nilfs->ns_last_segment_lock);
594         kunmap_atomic(kaddr);
595         brelse(header_bh);
596
597  out_sem:
598         up_read(&NILFS_MDT(sufile)->mi_sem);
599         return ret;
600 }
601
602 void nilfs_sufile_do_set_error(struct inode *sufile, __u64 segnum,
603                                struct buffer_head *header_bh,
604                                struct buffer_head *su_bh)
605 {
606         struct nilfs_segment_usage *su;
607         void *kaddr;
608         int suclean;
609
610         kaddr = kmap_atomic(su_bh->b_page);
611         su = nilfs_sufile_block_get_segment_usage(sufile, segnum, su_bh, kaddr);
612         if (nilfs_segment_usage_error(su)) {
613                 kunmap_atomic(kaddr);
614                 return;
615         }
616         suclean = nilfs_segment_usage_clean(su);
617         nilfs_segment_usage_set_error(su);
618         kunmap_atomic(kaddr);
619
620         if (suclean) {
621                 nilfs_sufile_mod_counter(header_bh, -1, 0);
622                 NILFS_SUI(sufile)->ncleansegs--;
623         }
624         mark_buffer_dirty(su_bh);
625         nilfs_mdt_mark_dirty(sufile);
626 }
627
628 /**
629  * nilfs_sufile_truncate_range - truncate range of segment array
630  * @sufile: inode of segment usage file
631  * @start: start segment number (inclusive)
632  * @end: end segment number (inclusive)
633  *
634  * Return Value: On success, 0 is returned.  On error, one of the
635  * following negative error codes is returned.
636  *
637  * %-EIO - I/O error.
638  *
639  * %-ENOMEM - Insufficient amount of memory available.
640  *
641  * %-EINVAL - Invalid number of segments specified
642  *
643  * %-EBUSY - Dirty or active segments are present in the range
644  */
645 static int nilfs_sufile_truncate_range(struct inode *sufile,
646                                        __u64 start, __u64 end)
647 {
648         struct the_nilfs *nilfs = sufile->i_sb->s_fs_info;
649         struct buffer_head *header_bh;
650         struct buffer_head *su_bh;
651         struct nilfs_segment_usage *su, *su2;
652         size_t susz = NILFS_MDT(sufile)->mi_entry_size;
653         unsigned long segusages_per_block;
654         unsigned long nsegs, ncleaned;
655         __u64 segnum;
656         void *kaddr;
657         ssize_t n, nc;
658         int ret;
659         int j;
660
661         nsegs = nilfs_sufile_get_nsegments(sufile);
662
663         ret = -EINVAL;
664         if (start > end || start >= nsegs)
665                 goto out;
666
667         ret = nilfs_sufile_get_header_block(sufile, &header_bh);
668         if (ret < 0)
669                 goto out;
670
671         segusages_per_block = nilfs_sufile_segment_usages_per_block(sufile);
672         ncleaned = 0;
673
674         for (segnum = start; segnum <= end; segnum += n) {
675                 n = min_t(unsigned long,
676                           segusages_per_block -
677                                   nilfs_sufile_get_offset(sufile, segnum),
678                           end - segnum + 1);
679                 ret = nilfs_sufile_get_segment_usage_block(sufile, segnum, 0,
680                                                            &su_bh);
681                 if (ret < 0) {
682                         if (ret != -ENOENT)
683                                 goto out_header;
684                         /* hole */
685                         continue;
686                 }
687                 kaddr = kmap_atomic(su_bh->b_page);
688                 su = nilfs_sufile_block_get_segment_usage(
689                         sufile, segnum, su_bh, kaddr);
690                 su2 = su;
691                 for (j = 0; j < n; j++, su = (void *)su + susz) {
692                         if ((le32_to_cpu(su->su_flags) &
693                              ~BIT(NILFS_SEGMENT_USAGE_ERROR)) ||
694                             nilfs_segment_is_active(nilfs, segnum + j)) {
695                                 ret = -EBUSY;
696                                 kunmap_atomic(kaddr);
697                                 brelse(su_bh);
698                                 goto out_header;
699                         }
700                 }
701                 nc = 0;
702                 for (su = su2, j = 0; j < n; j++, su = (void *)su + susz) {
703                         if (nilfs_segment_usage_error(su)) {
704                                 nilfs_segment_usage_set_clean(su);
705                                 nc++;
706                         }
707                 }
708                 kunmap_atomic(kaddr);
709                 if (nc > 0) {
710                         mark_buffer_dirty(su_bh);
711                         ncleaned += nc;
712                 }
713                 brelse(su_bh);
714
715                 if (n == segusages_per_block) {
716                         /* make hole */
717                         nilfs_sufile_delete_segment_usage_block(sufile, segnum);
718                 }
719         }
720         ret = 0;
721
722 out_header:
723         if (ncleaned > 0) {
724                 NILFS_SUI(sufile)->ncleansegs += ncleaned;
725                 nilfs_sufile_mod_counter(header_bh, ncleaned, 0);
726                 nilfs_mdt_mark_dirty(sufile);
727         }
728         brelse(header_bh);
729 out:
730         return ret;
731 }
732
733 /**
734  * nilfs_sufile_resize - resize segment array
735  * @sufile: inode of segment usage file
736  * @newnsegs: new number of segments
737  *
738  * Return Value: On success, 0 is returned.  On error, one of the
739  * following negative error codes is returned.
740  *
741  * %-EIO - I/O error.
742  *
743  * %-ENOMEM - Insufficient amount of memory available.
744  *
745  * %-ENOSPC - Enough free space is not left for shrinking
746  *
747  * %-EBUSY - Dirty or active segments exist in the region to be truncated
748  */
749 int nilfs_sufile_resize(struct inode *sufile, __u64 newnsegs)
750 {
751         struct the_nilfs *nilfs = sufile->i_sb->s_fs_info;
752         struct buffer_head *header_bh;
753         struct nilfs_sufile_header *header;
754         struct nilfs_sufile_info *sui = NILFS_SUI(sufile);
755         void *kaddr;
756         unsigned long nsegs, nrsvsegs;
757         int ret = 0;
758
759         down_write(&NILFS_MDT(sufile)->mi_sem);
760
761         nsegs = nilfs_sufile_get_nsegments(sufile);
762         if (nsegs == newnsegs)
763                 goto out;
764
765         ret = -ENOSPC;
766         nrsvsegs = nilfs_nrsvsegs(nilfs, newnsegs);
767         if (newnsegs < nsegs && nsegs - newnsegs + nrsvsegs > sui->ncleansegs)
768                 goto out;
769
770         ret = nilfs_sufile_get_header_block(sufile, &header_bh);
771         if (ret < 0)
772                 goto out;
773
774         if (newnsegs > nsegs) {
775                 sui->ncleansegs += newnsegs - nsegs;
776         } else /* newnsegs < nsegs */ {
777                 ret = nilfs_sufile_truncate_range(sufile, newnsegs, nsegs - 1);
778                 if (ret < 0)
779                         goto out_header;
780
781                 sui->ncleansegs -= nsegs - newnsegs;
782
783                 /*
784                  * If the sufile is successfully truncated, immediately adjust
785                  * the segment allocation space while locking the semaphore
786                  * "mi_sem" so that nilfs_sufile_alloc() never allocates
787                  * segments in the truncated space.
788                  */
789                 sui->allocmax = newnsegs - 1;
790                 sui->allocmin = 0;
791         }
792
793         kaddr = kmap_atomic(header_bh->b_page);
794         header = kaddr + bh_offset(header_bh);
795         header->sh_ncleansegs = cpu_to_le64(sui->ncleansegs);
796         kunmap_atomic(kaddr);
797
798         mark_buffer_dirty(header_bh);
799         nilfs_mdt_mark_dirty(sufile);
800         nilfs_set_nsegments(nilfs, newnsegs);
801
802 out_header:
803         brelse(header_bh);
804 out:
805         up_write(&NILFS_MDT(sufile)->mi_sem);
806         return ret;
807 }
808
809 /**
810  * nilfs_sufile_get_suinfo -
811  * @sufile: inode of segment usage file
812  * @segnum: segment number to start looking
813  * @buf: array of suinfo
814  * @sisz: byte size of suinfo
815  * @nsi: size of suinfo array
816  *
817  * Description:
818  *
819  * Return Value: On success, 0 is returned and .... On error, one of the
820  * following negative error codes is returned.
821  *
822  * %-EIO - I/O error.
823  *
824  * %-ENOMEM - Insufficient amount of memory available.
825  */
826 ssize_t nilfs_sufile_get_suinfo(struct inode *sufile, __u64 segnum, void *buf,
827                                 unsigned int sisz, size_t nsi)
828 {
829         struct buffer_head *su_bh;
830         struct nilfs_segment_usage *su;
831         struct nilfs_suinfo *si = buf;
832         size_t susz = NILFS_MDT(sufile)->mi_entry_size;
833         struct the_nilfs *nilfs = sufile->i_sb->s_fs_info;
834         void *kaddr;
835         unsigned long nsegs, segusages_per_block;
836         ssize_t n;
837         int ret, i, j;
838
839         down_read(&NILFS_MDT(sufile)->mi_sem);
840
841         segusages_per_block = nilfs_sufile_segment_usages_per_block(sufile);
842         nsegs = min_t(unsigned long,
843                       nilfs_sufile_get_nsegments(sufile) - segnum,
844                       nsi);
845         for (i = 0; i < nsegs; i += n, segnum += n) {
846                 n = min_t(unsigned long,
847                           segusages_per_block -
848                                   nilfs_sufile_get_offset(sufile, segnum),
849                           nsegs - i);
850                 ret = nilfs_sufile_get_segment_usage_block(sufile, segnum, 0,
851                                                            &su_bh);
852                 if (ret < 0) {
853                         if (ret != -ENOENT)
854                                 goto out;
855                         /* hole */
856                         memset(si, 0, sisz * n);
857                         si = (void *)si + sisz * n;
858                         continue;
859                 }
860
861                 kaddr = kmap_atomic(su_bh->b_page);
862                 su = nilfs_sufile_block_get_segment_usage(
863                         sufile, segnum, su_bh, kaddr);
864                 for (j = 0; j < n;
865                      j++, su = (void *)su + susz, si = (void *)si + sisz) {
866                         si->sui_lastmod = le64_to_cpu(su->su_lastmod);
867                         si->sui_nblocks = le32_to_cpu(su->su_nblocks);
868                         si->sui_flags = le32_to_cpu(su->su_flags) &
869                                 ~BIT(NILFS_SEGMENT_USAGE_ACTIVE);
870                         if (nilfs_segment_is_active(nilfs, segnum + j))
871                                 si->sui_flags |=
872                                         BIT(NILFS_SEGMENT_USAGE_ACTIVE);
873                 }
874                 kunmap_atomic(kaddr);
875                 brelse(su_bh);
876         }
877         ret = nsegs;
878
879  out:
880         up_read(&NILFS_MDT(sufile)->mi_sem);
881         return ret;
882 }
883
884 /**
885  * nilfs_sufile_set_suinfo - sets segment usage info
886  * @sufile: inode of segment usage file
887  * @buf: array of suinfo_update
888  * @supsz: byte size of suinfo_update
889  * @nsup: size of suinfo_update array
890  *
891  * Description: Takes an array of nilfs_suinfo_update structs and updates
892  * segment usage accordingly. Only the fields indicated by the sup_flags
893  * are updated.
894  *
895  * Return Value: On success, 0 is returned. On error, one of the
896  * following negative error codes is returned.
897  *
898  * %-EIO - I/O error.
899  *
900  * %-ENOMEM - Insufficient amount of memory available.
901  *
902  * %-EINVAL - Invalid values in input (segment number, flags or nblocks)
903  */
904 ssize_t nilfs_sufile_set_suinfo(struct inode *sufile, void *buf,
905                                 unsigned int supsz, size_t nsup)
906 {
907         struct the_nilfs *nilfs = sufile->i_sb->s_fs_info;
908         struct buffer_head *header_bh, *bh;
909         struct nilfs_suinfo_update *sup, *supend = buf + supsz * nsup;
910         struct nilfs_segment_usage *su;
911         void *kaddr;
912         unsigned long blkoff, prev_blkoff;
913         int cleansi, cleansu, dirtysi, dirtysu;
914         long ncleaned = 0, ndirtied = 0;
915         int ret = 0;
916
917         if (unlikely(nsup == 0))
918                 return ret;
919
920         for (sup = buf; sup < supend; sup = (void *)sup + supsz) {
921                 if (sup->sup_segnum >= nilfs->ns_nsegments
922                         || (sup->sup_flags &
923                                 (~0UL << __NR_NILFS_SUINFO_UPDATE_FIELDS))
924                         || (nilfs_suinfo_update_nblocks(sup) &&
925                                 sup->sup_sui.sui_nblocks >
926                                 nilfs->ns_blocks_per_segment))
927                         return -EINVAL;
928         }
929
930         down_write(&NILFS_MDT(sufile)->mi_sem);
931
932         ret = nilfs_sufile_get_header_block(sufile, &header_bh);
933         if (ret < 0)
934                 goto out_sem;
935
936         sup = buf;
937         blkoff = nilfs_sufile_get_blkoff(sufile, sup->sup_segnum);
938         ret = nilfs_mdt_get_block(sufile, blkoff, 1, NULL, &bh);
939         if (ret < 0)
940                 goto out_header;
941
942         for (;;) {
943                 kaddr = kmap_atomic(bh->b_page);
944                 su = nilfs_sufile_block_get_segment_usage(
945                         sufile, sup->sup_segnum, bh, kaddr);
946
947                 if (nilfs_suinfo_update_lastmod(sup))
948                         su->su_lastmod = cpu_to_le64(sup->sup_sui.sui_lastmod);
949
950                 if (nilfs_suinfo_update_nblocks(sup))
951                         su->su_nblocks = cpu_to_le32(sup->sup_sui.sui_nblocks);
952
953                 if (nilfs_suinfo_update_flags(sup)) {
954                         /*
955                          * Active flag is a virtual flag projected by running
956                          * nilfs kernel code - drop it not to write it to
957                          * disk.
958                          */
959                         sup->sup_sui.sui_flags &=
960                                         ~BIT(NILFS_SEGMENT_USAGE_ACTIVE);
961
962                         cleansi = nilfs_suinfo_clean(&sup->sup_sui);
963                         cleansu = nilfs_segment_usage_clean(su);
964                         dirtysi = nilfs_suinfo_dirty(&sup->sup_sui);
965                         dirtysu = nilfs_segment_usage_dirty(su);
966
967                         if (cleansi && !cleansu)
968                                 ++ncleaned;
969                         else if (!cleansi && cleansu)
970                                 --ncleaned;
971
972                         if (dirtysi && !dirtysu)
973                                 ++ndirtied;
974                         else if (!dirtysi && dirtysu)
975                                 --ndirtied;
976
977                         su->su_flags = cpu_to_le32(sup->sup_sui.sui_flags);
978                 }
979
980                 kunmap_atomic(kaddr);
981
982                 sup = (void *)sup + supsz;
983                 if (sup >= supend)
984                         break;
985
986                 prev_blkoff = blkoff;
987                 blkoff = nilfs_sufile_get_blkoff(sufile, sup->sup_segnum);
988                 if (blkoff == prev_blkoff)
989                         continue;
990
991                 /* get different block */
992                 mark_buffer_dirty(bh);
993                 put_bh(bh);
994                 ret = nilfs_mdt_get_block(sufile, blkoff, 1, NULL, &bh);
995                 if (unlikely(ret < 0))
996                         goto out_mark;
997         }
998         mark_buffer_dirty(bh);
999         put_bh(bh);
1000
1001  out_mark:
1002         if (ncleaned || ndirtied) {
1003                 nilfs_sufile_mod_counter(header_bh, (u64)ncleaned,
1004                                 (u64)ndirtied);
1005                 NILFS_SUI(sufile)->ncleansegs += ncleaned;
1006         }
1007         nilfs_mdt_mark_dirty(sufile);
1008  out_header:
1009         put_bh(header_bh);
1010  out_sem:
1011         up_write(&NILFS_MDT(sufile)->mi_sem);
1012         return ret;
1013 }
1014
1015 /**
1016  * nilfs_sufile_trim_fs() - trim ioctl handle function
1017  * @sufile: inode of segment usage file
1018  * @range: fstrim_range structure
1019  *
1020  * start:       First Byte to trim
1021  * len:         number of Bytes to trim from start
1022  * minlen:      minimum extent length in Bytes
1023  *
1024  * Decription: nilfs_sufile_trim_fs goes through all segments containing bytes
1025  * from start to start+len. start is rounded up to the next block boundary
1026  * and start+len is rounded down. For each clean segment blkdev_issue_discard
1027  * function is invoked.
1028  *
1029  * Return Value: On success, 0 is returned or negative error code, otherwise.
1030  */
1031 int nilfs_sufile_trim_fs(struct inode *sufile, struct fstrim_range *range)
1032 {
1033         struct the_nilfs *nilfs = sufile->i_sb->s_fs_info;
1034         struct buffer_head *su_bh;
1035         struct nilfs_segment_usage *su;
1036         void *kaddr;
1037         size_t n, i, susz = NILFS_MDT(sufile)->mi_entry_size;
1038         sector_t seg_start, seg_end, start_block, end_block;
1039         sector_t start = 0, nblocks = 0;
1040         u64 segnum, segnum_end, minlen, len, max_blocks, ndiscarded = 0;
1041         int ret = 0;
1042         unsigned int sects_per_block;
1043
1044         sects_per_block = (1 << nilfs->ns_blocksize_bits) /
1045                         bdev_logical_block_size(nilfs->ns_bdev);
1046         len = range->len >> nilfs->ns_blocksize_bits;
1047         minlen = range->minlen >> nilfs->ns_blocksize_bits;
1048         max_blocks = ((u64)nilfs->ns_nsegments * nilfs->ns_blocks_per_segment);
1049
1050         if (!len || range->start >= max_blocks << nilfs->ns_blocksize_bits)
1051                 return -EINVAL;
1052
1053         start_block = (range->start + nilfs->ns_blocksize - 1) >>
1054                         nilfs->ns_blocksize_bits;
1055
1056         /*
1057          * range->len can be very large (actually, it is set to
1058          * ULLONG_MAX by default) - truncate upper end of the range
1059          * carefully so as not to overflow.
1060          */
1061         if (max_blocks - start_block < len)
1062                 end_block = max_blocks - 1;
1063         else
1064                 end_block = start_block + len - 1;
1065
1066         segnum = nilfs_get_segnum_of_block(nilfs, start_block);
1067         segnum_end = nilfs_get_segnum_of_block(nilfs, end_block);
1068
1069         down_read(&NILFS_MDT(sufile)->mi_sem);
1070
1071         while (segnum <= segnum_end) {
1072                 n = nilfs_sufile_segment_usages_in_block(sufile, segnum,
1073                                 segnum_end);
1074
1075                 ret = nilfs_sufile_get_segment_usage_block(sufile, segnum, 0,
1076                                                            &su_bh);
1077                 if (ret < 0) {
1078                         if (ret != -ENOENT)
1079                                 goto out_sem;
1080                         /* hole */
1081                         segnum += n;
1082                         continue;
1083                 }
1084
1085                 kaddr = kmap_atomic(su_bh->b_page);
1086                 su = nilfs_sufile_block_get_segment_usage(sufile, segnum,
1087                                 su_bh, kaddr);
1088                 for (i = 0; i < n; ++i, ++segnum, su = (void *)su + susz) {
1089                         if (!nilfs_segment_usage_clean(su))
1090                                 continue;
1091
1092                         nilfs_get_segment_range(nilfs, segnum, &seg_start,
1093                                                 &seg_end);
1094
1095                         if (!nblocks) {
1096                                 /* start new extent */
1097                                 start = seg_start;
1098                                 nblocks = seg_end - seg_start + 1;
1099                                 continue;
1100                         }
1101
1102                         if (start + nblocks == seg_start) {
1103                                 /* add to previous extent */
1104                                 nblocks += seg_end - seg_start + 1;
1105                                 continue;
1106                         }
1107
1108                         /* discard previous extent */
1109                         if (start < start_block) {
1110                                 nblocks -= start_block - start;
1111                                 start = start_block;
1112                         }
1113
1114                         if (nblocks >= minlen) {
1115                                 kunmap_atomic(kaddr);
1116
1117                                 ret = blkdev_issue_discard(nilfs->ns_bdev,
1118                                                 start * sects_per_block,
1119                                                 nblocks * sects_per_block,
1120                                                 GFP_NOFS);
1121                                 if (ret < 0) {
1122                                         put_bh(su_bh);
1123                                         goto out_sem;
1124                                 }
1125
1126                                 ndiscarded += nblocks;
1127                                 kaddr = kmap_atomic(su_bh->b_page);
1128                                 su = nilfs_sufile_block_get_segment_usage(
1129                                         sufile, segnum, su_bh, kaddr);
1130                         }
1131
1132                         /* start new extent */
1133                         start = seg_start;
1134                         nblocks = seg_end - seg_start + 1;
1135                 }
1136                 kunmap_atomic(kaddr);
1137                 put_bh(su_bh);
1138         }
1139
1140
1141         if (nblocks) {
1142                 /* discard last extent */
1143                 if (start < start_block) {
1144                         nblocks -= start_block - start;
1145                         start = start_block;
1146                 }
1147                 if (start + nblocks > end_block + 1)
1148                         nblocks = end_block - start + 1;
1149
1150                 if (nblocks >= minlen) {
1151                         ret = blkdev_issue_discard(nilfs->ns_bdev,
1152                                         start * sects_per_block,
1153                                         nblocks * sects_per_block,
1154                                         GFP_NOFS);
1155                         if (!ret)
1156                                 ndiscarded += nblocks;
1157                 }
1158         }
1159
1160 out_sem:
1161         up_read(&NILFS_MDT(sufile)->mi_sem);
1162
1163         range->len = ndiscarded << nilfs->ns_blocksize_bits;
1164         return ret;
1165 }
1166
1167 /**
1168  * nilfs_sufile_read - read or get sufile inode
1169  * @sb: super block instance
1170  * @susize: size of a segment usage entry
1171  * @raw_inode: on-disk sufile inode
1172  * @inodep: buffer to store the inode
1173  */
1174 int nilfs_sufile_read(struct super_block *sb, size_t susize,
1175                       struct nilfs_inode *raw_inode, struct inode **inodep)
1176 {
1177         struct inode *sufile;
1178         struct nilfs_sufile_info *sui;
1179         struct buffer_head *header_bh;
1180         struct nilfs_sufile_header *header;
1181         void *kaddr;
1182         int err;
1183
1184         if (susize > sb->s_blocksize) {
1185                 nilfs_err(sb, "too large segment usage size: %zu bytes",
1186                           susize);
1187                 return -EINVAL;
1188         } else if (susize < NILFS_MIN_SEGMENT_USAGE_SIZE) {
1189                 nilfs_err(sb, "too small segment usage size: %zu bytes",
1190                           susize);
1191                 return -EINVAL;
1192         }
1193
1194         sufile = nilfs_iget_locked(sb, NULL, NILFS_SUFILE_INO);
1195         if (unlikely(!sufile))
1196                 return -ENOMEM;
1197         if (!(sufile->i_state & I_NEW))
1198                 goto out;
1199
1200         err = nilfs_mdt_init(sufile, NILFS_MDT_GFP, sizeof(*sui));
1201         if (err)
1202                 goto failed;
1203
1204         nilfs_mdt_set_entry_size(sufile, susize,
1205                                  sizeof(struct nilfs_sufile_header));
1206
1207         err = nilfs_read_inode_common(sufile, raw_inode);
1208         if (err)
1209                 goto failed;
1210
1211         err = nilfs_sufile_get_header_block(sufile, &header_bh);
1212         if (err)
1213                 goto failed;
1214
1215         sui = NILFS_SUI(sufile);
1216         kaddr = kmap_atomic(header_bh->b_page);
1217         header = kaddr + bh_offset(header_bh);
1218         sui->ncleansegs = le64_to_cpu(header->sh_ncleansegs);
1219         kunmap_atomic(kaddr);
1220         brelse(header_bh);
1221
1222         sui->allocmax = nilfs_sufile_get_nsegments(sufile) - 1;
1223         sui->allocmin = 0;
1224
1225         unlock_new_inode(sufile);
1226  out:
1227         *inodep = sufile;
1228         return 0;
1229  failed:
1230         iget_failed(sufile);
1231         return err;
1232 }