Merge tag 'kthread-cleanups-for-v5.19' of git://git.kernel.org/pub/scm/linux/kernel...
[linux-2.6-microblaze.git] / fs / ntfs3 / inode.c
1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  *
4  * Copyright (C) 2019-2021 Paragon Software GmbH, All rights reserved.
5  *
6  */
7
8 #include <linux/buffer_head.h>
9 #include <linux/fs.h>
10 #include <linux/mpage.h>
11 #include <linux/namei.h>
12 #include <linux/nls.h>
13 #include <linux/uio.h>
14 #include <linux/writeback.h>
15
16 #include "debug.h"
17 #include "ntfs.h"
18 #include "ntfs_fs.h"
19
20 /*
21  * ntfs_read_mft - Read record and parses MFT.
22  */
23 static struct inode *ntfs_read_mft(struct inode *inode,
24                                    const struct cpu_str *name,
25                                    const struct MFT_REF *ref)
26 {
27         int err = 0;
28         struct ntfs_inode *ni = ntfs_i(inode);
29         struct super_block *sb = inode->i_sb;
30         struct ntfs_sb_info *sbi = sb->s_fs_info;
31         mode_t mode = 0;
32         struct ATTR_STD_INFO5 *std5 = NULL;
33         struct ATTR_LIST_ENTRY *le;
34         struct ATTRIB *attr;
35         bool is_match = false;
36         bool is_root = false;
37         bool is_dir;
38         unsigned long ino = inode->i_ino;
39         u32 rp_fa = 0, asize, t32;
40         u16 roff, rsize, names = 0;
41         const struct ATTR_FILE_NAME *fname = NULL;
42         const struct INDEX_ROOT *root;
43         struct REPARSE_DATA_BUFFER rp; // 0x18 bytes
44         u64 t64;
45         struct MFT_REC *rec;
46         struct runs_tree *run;
47
48         inode->i_op = NULL;
49         /* Setup 'uid' and 'gid' */
50         inode->i_uid = sbi->options->fs_uid;
51         inode->i_gid = sbi->options->fs_gid;
52
53         err = mi_init(&ni->mi, sbi, ino);
54         if (err)
55                 goto out;
56
57         if (!sbi->mft.ni && ino == MFT_REC_MFT && !sb->s_root) {
58                 t64 = sbi->mft.lbo >> sbi->cluster_bits;
59                 t32 = bytes_to_cluster(sbi, MFT_REC_VOL * sbi->record_size);
60                 sbi->mft.ni = ni;
61                 init_rwsem(&ni->file.run_lock);
62
63                 if (!run_add_entry(&ni->file.run, 0, t64, t32, true)) {
64                         err = -ENOMEM;
65                         goto out;
66                 }
67         }
68
69         err = mi_read(&ni->mi, ino == MFT_REC_MFT);
70
71         if (err)
72                 goto out;
73
74         rec = ni->mi.mrec;
75
76         if (sbi->flags & NTFS_FLAGS_LOG_REPLAYING) {
77                 ;
78         } else if (ref->seq != rec->seq) {
79                 err = -EINVAL;
80                 ntfs_err(sb, "MFT: r=%lx, expect seq=%x instead of %x!", ino,
81                          le16_to_cpu(ref->seq), le16_to_cpu(rec->seq));
82                 goto out;
83         } else if (!is_rec_inuse(rec)) {
84                 err = -EINVAL;
85                 ntfs_err(sb, "Inode r=%x is not in use!", (u32)ino);
86                 goto out;
87         }
88
89         if (le32_to_cpu(rec->total) != sbi->record_size) {
90                 /* Bad inode? */
91                 err = -EINVAL;
92                 goto out;
93         }
94
95         if (!is_rec_base(rec))
96                 goto Ok;
97
98         /* Record should contain $I30 root. */
99         is_dir = rec->flags & RECORD_FLAG_DIR;
100
101         inode->i_generation = le16_to_cpu(rec->seq);
102
103         /* Enumerate all struct Attributes MFT. */
104         le = NULL;
105         attr = NULL;
106
107         /*
108          * To reduce tab pressure use goto instead of
109          * while( (attr = ni_enum_attr_ex(ni, attr, &le, NULL) ))
110          */
111 next_attr:
112         run = NULL;
113         err = -EINVAL;
114         attr = ni_enum_attr_ex(ni, attr, &le, NULL);
115         if (!attr)
116                 goto end_enum;
117
118         if (le && le->vcn) {
119                 /* This is non primary attribute segment. Ignore if not MFT. */
120                 if (ino != MFT_REC_MFT || attr->type != ATTR_DATA)
121                         goto next_attr;
122
123                 run = &ni->file.run;
124                 asize = le32_to_cpu(attr->size);
125                 goto attr_unpack_run;
126         }
127
128         roff = attr->non_res ? 0 : le16_to_cpu(attr->res.data_off);
129         rsize = attr->non_res ? 0 : le32_to_cpu(attr->res.data_size);
130         asize = le32_to_cpu(attr->size);
131
132         switch (attr->type) {
133         case ATTR_STD:
134                 if (attr->non_res ||
135                     asize < sizeof(struct ATTR_STD_INFO) + roff ||
136                     rsize < sizeof(struct ATTR_STD_INFO))
137                         goto out;
138
139                 if (std5)
140                         goto next_attr;
141
142                 std5 = Add2Ptr(attr, roff);
143
144 #ifdef STATX_BTIME
145                 nt2kernel(std5->cr_time, &ni->i_crtime);
146 #endif
147                 nt2kernel(std5->a_time, &inode->i_atime);
148                 nt2kernel(std5->c_time, &inode->i_ctime);
149                 nt2kernel(std5->m_time, &inode->i_mtime);
150
151                 ni->std_fa = std5->fa;
152
153                 if (asize >= sizeof(struct ATTR_STD_INFO5) + roff &&
154                     rsize >= sizeof(struct ATTR_STD_INFO5))
155                         ni->std_security_id = std5->security_id;
156                 goto next_attr;
157
158         case ATTR_LIST:
159                 if (attr->name_len || le || ino == MFT_REC_LOG)
160                         goto out;
161
162                 err = ntfs_load_attr_list(ni, attr);
163                 if (err)
164                         goto out;
165
166                 le = NULL;
167                 attr = NULL;
168                 goto next_attr;
169
170         case ATTR_NAME:
171                 if (attr->non_res || asize < SIZEOF_ATTRIBUTE_FILENAME + roff ||
172                     rsize < SIZEOF_ATTRIBUTE_FILENAME)
173                         goto out;
174
175                 fname = Add2Ptr(attr, roff);
176                 if (fname->type == FILE_NAME_DOS)
177                         goto next_attr;
178
179                 names += 1;
180                 if (name && name->len == fname->name_len &&
181                     !ntfs_cmp_names_cpu(name, (struct le_str *)&fname->name_len,
182                                         NULL, false))
183                         is_match = true;
184
185                 goto next_attr;
186
187         case ATTR_DATA:
188                 if (is_dir) {
189                         /* Ignore data attribute in dir record. */
190                         goto next_attr;
191                 }
192
193                 if (ino == MFT_REC_BADCLUST && !attr->non_res)
194                         goto next_attr;
195
196                 if (attr->name_len &&
197                     ((ino != MFT_REC_BADCLUST || !attr->non_res ||
198                       attr->name_len != ARRAY_SIZE(BAD_NAME) ||
199                       memcmp(attr_name(attr), BAD_NAME, sizeof(BAD_NAME))) &&
200                      (ino != MFT_REC_SECURE || !attr->non_res ||
201                       attr->name_len != ARRAY_SIZE(SDS_NAME) ||
202                       memcmp(attr_name(attr), SDS_NAME, sizeof(SDS_NAME))))) {
203                         /* File contains stream attribute. Ignore it. */
204                         goto next_attr;
205                 }
206
207                 if (is_attr_sparsed(attr))
208                         ni->std_fa |= FILE_ATTRIBUTE_SPARSE_FILE;
209                 else
210                         ni->std_fa &= ~FILE_ATTRIBUTE_SPARSE_FILE;
211
212                 if (is_attr_compressed(attr))
213                         ni->std_fa |= FILE_ATTRIBUTE_COMPRESSED;
214                 else
215                         ni->std_fa &= ~FILE_ATTRIBUTE_COMPRESSED;
216
217                 if (is_attr_encrypted(attr))
218                         ni->std_fa |= FILE_ATTRIBUTE_ENCRYPTED;
219                 else
220                         ni->std_fa &= ~FILE_ATTRIBUTE_ENCRYPTED;
221
222                 if (!attr->non_res) {
223                         ni->i_valid = inode->i_size = rsize;
224                         inode_set_bytes(inode, rsize);
225                 }
226
227                 mode = S_IFREG | (0777 & sbi->options->fs_fmask_inv);
228
229                 if (!attr->non_res) {
230                         ni->ni_flags |= NI_FLAG_RESIDENT;
231                         goto next_attr;
232                 }
233
234                 inode_set_bytes(inode, attr_ondisk_size(attr));
235
236                 ni->i_valid = le64_to_cpu(attr->nres.valid_size);
237                 inode->i_size = le64_to_cpu(attr->nres.data_size);
238                 if (!attr->nres.alloc_size)
239                         goto next_attr;
240
241                 run = ino == MFT_REC_BITMAP ? &sbi->used.bitmap.run
242                                             : &ni->file.run;
243                 break;
244
245         case ATTR_ROOT:
246                 if (attr->non_res)
247                         goto out;
248
249                 root = Add2Ptr(attr, roff);
250                 is_root = true;
251
252                 if (attr->name_len != ARRAY_SIZE(I30_NAME) ||
253                     memcmp(attr_name(attr), I30_NAME, sizeof(I30_NAME)))
254                         goto next_attr;
255
256                 if (root->type != ATTR_NAME ||
257                     root->rule != NTFS_COLLATION_TYPE_FILENAME)
258                         goto out;
259
260                 if (!is_dir)
261                         goto next_attr;
262
263                 ni->ni_flags |= NI_FLAG_DIR;
264
265                 err = indx_init(&ni->dir, sbi, attr, INDEX_MUTEX_I30);
266                 if (err)
267                         goto out;
268
269                 mode = sb->s_root
270                                ? (S_IFDIR | (0777 & sbi->options->fs_dmask_inv))
271                                : (S_IFDIR | 0777);
272                 goto next_attr;
273
274         case ATTR_ALLOC:
275                 if (!is_root || attr->name_len != ARRAY_SIZE(I30_NAME) ||
276                     memcmp(attr_name(attr), I30_NAME, sizeof(I30_NAME)))
277                         goto next_attr;
278
279                 inode->i_size = le64_to_cpu(attr->nres.data_size);
280                 ni->i_valid = le64_to_cpu(attr->nres.valid_size);
281                 inode_set_bytes(inode, le64_to_cpu(attr->nres.alloc_size));
282
283                 run = &ni->dir.alloc_run;
284                 break;
285
286         case ATTR_BITMAP:
287                 if (ino == MFT_REC_MFT) {
288                         if (!attr->non_res)
289                                 goto out;
290 #ifndef CONFIG_NTFS3_64BIT_CLUSTER
291                         /* 0x20000000 = 2^32 / 8 */
292                         if (le64_to_cpu(attr->nres.alloc_size) >= 0x20000000)
293                                 goto out;
294 #endif
295                         run = &sbi->mft.bitmap.run;
296                         break;
297                 } else if (is_dir && attr->name_len == ARRAY_SIZE(I30_NAME) &&
298                            !memcmp(attr_name(attr), I30_NAME,
299                                    sizeof(I30_NAME)) &&
300                            attr->non_res) {
301                         run = &ni->dir.bitmap_run;
302                         break;
303                 }
304                 goto next_attr;
305
306         case ATTR_REPARSE:
307                 if (attr->name_len)
308                         goto next_attr;
309
310                 rp_fa = ni_parse_reparse(ni, attr, &rp);
311                 switch (rp_fa) {
312                 case REPARSE_LINK:
313                         /*
314                          * Normal symlink.
315                          * Assume one unicode symbol == one utf8.
316                          */
317                         inode->i_size = le16_to_cpu(rp.SymbolicLinkReparseBuffer
318                                                             .PrintNameLength) /
319                                         sizeof(u16);
320
321                         ni->i_valid = inode->i_size;
322
323                         /* Clear directory bit. */
324                         if (ni->ni_flags & NI_FLAG_DIR) {
325                                 indx_clear(&ni->dir);
326                                 memset(&ni->dir, 0, sizeof(ni->dir));
327                                 ni->ni_flags &= ~NI_FLAG_DIR;
328                         } else {
329                                 run_close(&ni->file.run);
330                         }
331                         mode = S_IFLNK | 0777;
332                         is_dir = false;
333                         if (attr->non_res) {
334                                 run = &ni->file.run;
335                                 goto attr_unpack_run; // Double break.
336                         }
337                         break;
338
339                 case REPARSE_COMPRESSED:
340                         break;
341
342                 case REPARSE_DEDUPLICATED:
343                         break;
344                 }
345                 goto next_attr;
346
347         case ATTR_EA_INFO:
348                 if (!attr->name_len &&
349                     resident_data_ex(attr, sizeof(struct EA_INFO))) {
350                         ni->ni_flags |= NI_FLAG_EA;
351                         /*
352                          * ntfs_get_wsl_perm updates inode->i_uid, inode->i_gid, inode->i_mode
353                          */
354                         inode->i_mode = mode;
355                         ntfs_get_wsl_perm(inode);
356                         mode = inode->i_mode;
357                 }
358                 goto next_attr;
359
360         default:
361                 goto next_attr;
362         }
363
364 attr_unpack_run:
365         roff = le16_to_cpu(attr->nres.run_off);
366
367         t64 = le64_to_cpu(attr->nres.svcn);
368         err = run_unpack_ex(run, sbi, ino, t64, le64_to_cpu(attr->nres.evcn),
369                             t64, Add2Ptr(attr, roff), asize - roff);
370         if (err < 0)
371                 goto out;
372         err = 0;
373         goto next_attr;
374
375 end_enum:
376
377         if (!std5)
378                 goto out;
379
380         if (!is_match && name) {
381                 /* Reuse rec as buffer for ascii name. */
382                 err = -ENOENT;
383                 goto out;
384         }
385
386         if (std5->fa & FILE_ATTRIBUTE_READONLY)
387                 mode &= ~0222;
388
389         if (!names) {
390                 err = -EINVAL;
391                 goto out;
392         }
393
394         if (names != le16_to_cpu(rec->hard_links)) {
395                 /* Correct minor error on the fly. Do not mark inode as dirty. */
396                 rec->hard_links = cpu_to_le16(names);
397                 ni->mi.dirty = true;
398         }
399
400         set_nlink(inode, names);
401
402         if (S_ISDIR(mode)) {
403                 ni->std_fa |= FILE_ATTRIBUTE_DIRECTORY;
404
405                 /*
406                  * Dot and dot-dot should be included in count but was not
407                  * included in enumeration.
408                  * Usually a hard links to directories are disabled.
409                  */
410                 inode->i_op = &ntfs_dir_inode_operations;
411                 inode->i_fop = &ntfs_dir_operations;
412                 ni->i_valid = 0;
413         } else if (S_ISLNK(mode)) {
414                 ni->std_fa &= ~FILE_ATTRIBUTE_DIRECTORY;
415                 inode->i_op = &ntfs_link_inode_operations;
416                 inode->i_fop = NULL;
417                 inode_nohighmem(inode);
418         } else if (S_ISREG(mode)) {
419                 ni->std_fa &= ~FILE_ATTRIBUTE_DIRECTORY;
420                 inode->i_op = &ntfs_file_inode_operations;
421                 inode->i_fop = &ntfs_file_operations;
422                 inode->i_mapping->a_ops =
423                         is_compressed(ni) ? &ntfs_aops_cmpr : &ntfs_aops;
424                 if (ino != MFT_REC_MFT)
425                         init_rwsem(&ni->file.run_lock);
426         } else if (S_ISCHR(mode) || S_ISBLK(mode) || S_ISFIFO(mode) ||
427                    S_ISSOCK(mode)) {
428                 inode->i_op = &ntfs_special_inode_operations;
429                 init_special_inode(inode, mode, inode->i_rdev);
430         } else if (fname && fname->home.low == cpu_to_le32(MFT_REC_EXTEND) &&
431                    fname->home.seq == cpu_to_le16(MFT_REC_EXTEND)) {
432                 /* Records in $Extend are not a files or general directories. */
433         } else {
434                 err = -EINVAL;
435                 goto out;
436         }
437
438         if ((sbi->options->sys_immutable &&
439              (std5->fa & FILE_ATTRIBUTE_SYSTEM)) &&
440             !S_ISFIFO(mode) && !S_ISSOCK(mode) && !S_ISLNK(mode)) {
441                 inode->i_flags |= S_IMMUTABLE;
442         } else {
443                 inode->i_flags &= ~S_IMMUTABLE;
444         }
445
446         inode->i_mode = mode;
447         if (!(ni->ni_flags & NI_FLAG_EA)) {
448                 /* If no xattr then no security (stored in xattr). */
449                 inode->i_flags |= S_NOSEC;
450         }
451
452 Ok:
453         if (ino == MFT_REC_MFT && !sb->s_root)
454                 sbi->mft.ni = NULL;
455
456         unlock_new_inode(inode);
457
458         return inode;
459
460 out:
461         if (ino == MFT_REC_MFT && !sb->s_root)
462                 sbi->mft.ni = NULL;
463
464         iget_failed(inode);
465         return ERR_PTR(err);
466 }
467
468 /*
469  * ntfs_test_inode
470  *
471  * Return: 1 if match.
472  */
473 static int ntfs_test_inode(struct inode *inode, void *data)
474 {
475         struct MFT_REF *ref = data;
476
477         return ino_get(ref) == inode->i_ino;
478 }
479
480 static int ntfs_set_inode(struct inode *inode, void *data)
481 {
482         const struct MFT_REF *ref = data;
483
484         inode->i_ino = ino_get(ref);
485         return 0;
486 }
487
488 struct inode *ntfs_iget5(struct super_block *sb, const struct MFT_REF *ref,
489                          const struct cpu_str *name)
490 {
491         struct inode *inode;
492
493         inode = iget5_locked(sb, ino_get(ref), ntfs_test_inode, ntfs_set_inode,
494                              (void *)ref);
495         if (unlikely(!inode))
496                 return ERR_PTR(-ENOMEM);
497
498         /* If this is a freshly allocated inode, need to read it now. */
499         if (inode->i_state & I_NEW)
500                 inode = ntfs_read_mft(inode, name, ref);
501         else if (ref->seq != ntfs_i(inode)->mi.mrec->seq) {
502                 /* Inode overlaps? */
503                 make_bad_inode(inode);
504         }
505
506         return inode;
507 }
508
/* Tells ntfs_get_block_vbo() which wrapper it was called from. */
enum get_block_ctx {
	GET_BLOCK_GENERAL,	/* 0: ntfs_get_block() */
	GET_BLOCK_WRITE_BEGIN,	/* 1: ntfs_get_block_write_begin() */
	GET_BLOCK_DIRECT_IO_R,	/* 2: ntfs_get_block_direct_IO_R() */
	GET_BLOCK_DIRECT_IO_W,	/* 3: ntfs_get_block_direct_IO_W() */
	GET_BLOCK_BMAP,		/* 4: ntfs_get_block_bmap() */
};
516
517 static noinline int ntfs_get_block_vbo(struct inode *inode, u64 vbo,
518                                        struct buffer_head *bh, int create,
519                                        enum get_block_ctx ctx)
520 {
521         struct super_block *sb = inode->i_sb;
522         struct ntfs_sb_info *sbi = sb->s_fs_info;
523         struct ntfs_inode *ni = ntfs_i(inode);
524         struct page *page = bh->b_page;
525         u8 cluster_bits = sbi->cluster_bits;
526         u32 block_size = sb->s_blocksize;
527         u64 bytes, lbo, valid;
528         u32 off;
529         int err;
530         CLST vcn, lcn, len;
531         bool new;
532
533         /* Clear previous state. */
534         clear_buffer_new(bh);
535         clear_buffer_uptodate(bh);
536
537         /* Direct write uses 'create=0'. */
538         if (!create && vbo >= ni->i_valid) {
539                 /* Out of valid. */
540                 return 0;
541         }
542
543         if (vbo >= inode->i_size) {
544                 /* Out of size. */
545                 return 0;
546         }
547
548         if (is_resident(ni)) {
549                 ni_lock(ni);
550                 err = attr_data_read_resident(ni, page);
551                 ni_unlock(ni);
552
553                 if (!err)
554                         set_buffer_uptodate(bh);
555                 bh->b_size = block_size;
556                 return err;
557         }
558
559         vcn = vbo >> cluster_bits;
560         off = vbo & sbi->cluster_mask;
561         new = false;
562
563         err = attr_data_get_block(ni, vcn, 1, &lcn, &len, create ? &new : NULL);
564         if (err)
565                 goto out;
566
567         if (!len)
568                 return 0;
569
570         bytes = ((u64)len << cluster_bits) - off;
571
572         if (lcn == SPARSE_LCN) {
573                 if (!create) {
574                         if (bh->b_size > bytes)
575                                 bh->b_size = bytes;
576                         return 0;
577                 }
578                 WARN_ON(1);
579         }
580
581         if (new) {
582                 set_buffer_new(bh);
583                 if ((len << cluster_bits) > block_size)
584                         ntfs_sparse_cluster(inode, page, vcn, len);
585         }
586
587         lbo = ((u64)lcn << cluster_bits) + off;
588
589         set_buffer_mapped(bh);
590         bh->b_bdev = sb->s_bdev;
591         bh->b_blocknr = lbo >> sb->s_blocksize_bits;
592
593         valid = ni->i_valid;
594
595         if (ctx == GET_BLOCK_DIRECT_IO_W) {
596                 /* ntfs_direct_IO will update ni->i_valid. */
597                 if (vbo >= valid)
598                         set_buffer_new(bh);
599         } else if (create) {
600                 /* Normal write. */
601                 if (bytes > bh->b_size)
602                         bytes = bh->b_size;
603
604                 if (vbo >= valid)
605                         set_buffer_new(bh);
606
607                 if (vbo + bytes > valid) {
608                         ni->i_valid = vbo + bytes;
609                         mark_inode_dirty(inode);
610                 }
611         } else if (vbo >= valid) {
612                 /* Read out of valid data. */
613                 /* Should never be here 'cause already checked. */
614                 clear_buffer_mapped(bh);
615         } else if (vbo + bytes <= valid) {
616                 /* Normal read. */
617         } else if (vbo + block_size <= valid) {
618                 /* Normal short read. */
619                 bytes = block_size;
620         } else {
621                 /*
622                  * Read across valid size: vbo < valid && valid < vbo + block_size
623                  */
624                 bytes = block_size;
625
626                 if (page) {
627                         u32 voff = valid - vbo;
628
629                         bh->b_size = block_size;
630                         off = vbo & (PAGE_SIZE - 1);
631                         set_bh_page(bh, page, off);
632                         ll_rw_block(REQ_OP_READ, 0, 1, &bh);
633                         wait_on_buffer(bh);
634                         if (!buffer_uptodate(bh)) {
635                                 err = -EIO;
636                                 goto out;
637                         }
638                         zero_user_segment(page, off + voff, off + block_size);
639                 }
640         }
641
642         if (bh->b_size > bytes)
643                 bh->b_size = bytes;
644
645 #ifndef __LP64__
646         if (ctx == GET_BLOCK_DIRECT_IO_W || ctx == GET_BLOCK_DIRECT_IO_R) {
647                 static_assert(sizeof(size_t) < sizeof(loff_t));
648                 if (bytes > 0x40000000u)
649                         bh->b_size = 0x40000000u;
650         }
651 #endif
652
653         return 0;
654
655 out:
656         return err;
657 }
658
659 int ntfs_get_block(struct inode *inode, sector_t vbn,
660                    struct buffer_head *bh_result, int create)
661 {
662         return ntfs_get_block_vbo(inode, (u64)vbn << inode->i_blkbits,
663                                   bh_result, create, GET_BLOCK_GENERAL);
664 }
665
666 static int ntfs_get_block_bmap(struct inode *inode, sector_t vsn,
667                                struct buffer_head *bh_result, int create)
668 {
669         return ntfs_get_block_vbo(inode,
670                                   (u64)vsn << inode->i_sb->s_blocksize_bits,
671                                   bh_result, create, GET_BLOCK_BMAP);
672 }
673
674 static sector_t ntfs_bmap(struct address_space *mapping, sector_t block)
675 {
676         return generic_block_bmap(mapping, block, ntfs_get_block_bmap);
677 }
678
679 static int ntfs_read_folio(struct file *file, struct folio *folio)
680 {
681         struct page *page = &folio->page;
682         int err;
683         struct address_space *mapping = page->mapping;
684         struct inode *inode = mapping->host;
685         struct ntfs_inode *ni = ntfs_i(inode);
686
687         if (is_resident(ni)) {
688                 ni_lock(ni);
689                 err = attr_data_read_resident(ni, page);
690                 ni_unlock(ni);
691                 if (err != E_NTFS_NONRESIDENT) {
692                         unlock_page(page);
693                         return err;
694                 }
695         }
696
697         if (is_compressed(ni)) {
698                 ni_lock(ni);
699                 err = ni_readpage_cmpr(ni, page);
700                 ni_unlock(ni);
701                 return err;
702         }
703
704         /* Normal + sparse files. */
705         return mpage_read_folio(folio, ntfs_get_block);
706 }
707
708 static void ntfs_readahead(struct readahead_control *rac)
709 {
710         struct address_space *mapping = rac->mapping;
711         struct inode *inode = mapping->host;
712         struct ntfs_inode *ni = ntfs_i(inode);
713         u64 valid;
714         loff_t pos;
715
716         if (is_resident(ni)) {
717                 /* No readahead for resident. */
718                 return;
719         }
720
721         if (is_compressed(ni)) {
722                 /* No readahead for compressed. */
723                 return;
724         }
725
726         valid = ni->i_valid;
727         pos = readahead_pos(rac);
728
729         if (valid < i_size_read(inode) && pos <= valid &&
730             valid < pos + readahead_length(rac)) {
731                 /* Range cross 'valid'. Read it page by page. */
732                 return;
733         }
734
735         mpage_readahead(rac, ntfs_get_block);
736 }
737
738 static int ntfs_get_block_direct_IO_R(struct inode *inode, sector_t iblock,
739                                       struct buffer_head *bh_result, int create)
740 {
741         return ntfs_get_block_vbo(inode, (u64)iblock << inode->i_blkbits,
742                                   bh_result, create, GET_BLOCK_DIRECT_IO_R);
743 }
744
745 static int ntfs_get_block_direct_IO_W(struct inode *inode, sector_t iblock,
746                                       struct buffer_head *bh_result, int create)
747 {
748         return ntfs_get_block_vbo(inode, (u64)iblock << inode->i_blkbits,
749                                   bh_result, create, GET_BLOCK_DIRECT_IO_W);
750 }
751
752 static ssize_t ntfs_direct_IO(struct kiocb *iocb, struct iov_iter *iter)
753 {
754         struct file *file = iocb->ki_filp;
755         struct address_space *mapping = file->f_mapping;
756         struct inode *inode = mapping->host;
757         struct ntfs_inode *ni = ntfs_i(inode);
758         loff_t vbo = iocb->ki_pos;
759         loff_t end;
760         int wr = iov_iter_rw(iter) & WRITE;
761         loff_t valid;
762         ssize_t ret;
763
764         if (is_resident(ni)) {
765                 /* Switch to buffered write. */
766                 ret = 0;
767                 goto out;
768         }
769
770         ret = blockdev_direct_IO(iocb, inode, iter,
771                                  wr ? ntfs_get_block_direct_IO_W
772                                     : ntfs_get_block_direct_IO_R);
773
774         if (ret <= 0)
775                 goto out;
776
777         end = vbo + ret;
778         valid = ni->i_valid;
779         if (wr) {
780                 if (end > valid && !S_ISBLK(inode->i_mode)) {
781                         ni->i_valid = end;
782                         mark_inode_dirty(inode);
783                 }
784         } else if (vbo < valid && valid < end) {
785                 /* Fix page. */
786                 iov_iter_revert(iter, end - valid);
787                 iov_iter_zero(end - valid, iter);
788         }
789
790 out:
791         return ret;
792 }
793
794 int ntfs_set_size(struct inode *inode, u64 new_size)
795 {
796         struct super_block *sb = inode->i_sb;
797         struct ntfs_sb_info *sbi = sb->s_fs_info;
798         struct ntfs_inode *ni = ntfs_i(inode);
799         int err;
800
801         /* Check for maximum file size. */
802         if (is_sparsed(ni) || is_compressed(ni)) {
803                 if (new_size > sbi->maxbytes_sparse) {
804                         err = -EFBIG;
805                         goto out;
806                 }
807         } else if (new_size > sbi->maxbytes) {
808                 err = -EFBIG;
809                 goto out;
810         }
811
812         ni_lock(ni);
813         down_write(&ni->file.run_lock);
814
815         err = attr_set_size(ni, ATTR_DATA, NULL, 0, &ni->file.run, new_size,
816                             &ni->i_valid, true, NULL);
817
818         up_write(&ni->file.run_lock);
819         ni_unlock(ni);
820
821         mark_inode_dirty(inode);
822
823 out:
824         return err;
825 }
826
827 static int ntfs_writepage(struct page *page, struct writeback_control *wbc)
828 {
829         struct address_space *mapping = page->mapping;
830         struct inode *inode = mapping->host;
831         struct ntfs_inode *ni = ntfs_i(inode);
832         int err;
833
834         if (is_resident(ni)) {
835                 ni_lock(ni);
836                 err = attr_data_write_resident(ni, page);
837                 ni_unlock(ni);
838                 if (err != E_NTFS_NONRESIDENT) {
839                         unlock_page(page);
840                         return err;
841                 }
842         }
843
844         return block_write_full_page(page, ntfs_get_block, wbc);
845 }
846
847 static int ntfs_writepages(struct address_space *mapping,
848                            struct writeback_control *wbc)
849 {
850         struct inode *inode = mapping->host;
851         struct ntfs_inode *ni = ntfs_i(inode);
852         /* Redirect call to 'ntfs_writepage' for resident files. */
853         get_block_t *get_block = is_resident(ni) ? NULL : &ntfs_get_block;
854
855         return mpage_writepages(mapping, wbc, get_block);
856 }
857
858 static int ntfs_get_block_write_begin(struct inode *inode, sector_t vbn,
859                                       struct buffer_head *bh_result, int create)
860 {
861         return ntfs_get_block_vbo(inode, (u64)vbn << inode->i_blkbits,
862                                   bh_result, create, GET_BLOCK_WRITE_BEGIN);
863 }
864
865 int ntfs_write_begin(struct file *file, struct address_space *mapping,
866                      loff_t pos, u32 len, struct page **pagep, void **fsdata)
867 {
868         int err;
869         struct inode *inode = mapping->host;
870         struct ntfs_inode *ni = ntfs_i(inode);
871
872         *pagep = NULL;
873         if (is_resident(ni)) {
874                 struct page *page = grab_cache_page_write_begin(
875                         mapping, pos >> PAGE_SHIFT);
876
877                 if (!page) {
878                         err = -ENOMEM;
879                         goto out;
880                 }
881
882                 ni_lock(ni);
883                 err = attr_data_read_resident(ni, page);
884                 ni_unlock(ni);
885
886                 if (!err) {
887                         *pagep = page;
888                         goto out;
889                 }
890                 unlock_page(page);
891                 put_page(page);
892
893                 if (err != E_NTFS_NONRESIDENT)
894                         goto out;
895         }
896
897         err = block_write_begin(mapping, pos, len, pagep,
898                                 ntfs_get_block_write_begin);
899
900 out:
901         return err;
902 }
903
904 /*
905  * ntfs_write_end - Address_space_operations::write_end.
906  */
907 int ntfs_write_end(struct file *file, struct address_space *mapping,
908                    loff_t pos, u32 len, u32 copied, struct page *page,
909                    void *fsdata)
910 {
911         struct inode *inode = mapping->host;
912         struct ntfs_inode *ni = ntfs_i(inode);
913         u64 valid = ni->i_valid;
914         bool dirty = false;
915         int err;
916
917         if (is_resident(ni)) {
918                 ni_lock(ni);
919                 err = attr_data_write_resident(ni, page);
920                 ni_unlock(ni);
921                 if (!err) {
922                         dirty = true;
923                         /* Clear any buffers in page. */
924                         if (page_has_buffers(page)) {
925                                 struct buffer_head *head, *bh;
926
927                                 bh = head = page_buffers(page);
928                                 do {
929                                         clear_buffer_dirty(bh);
930                                         clear_buffer_mapped(bh);
931                                         set_buffer_uptodate(bh);
932                                 } while (head != (bh = bh->b_this_page));
933                         }
934                         SetPageUptodate(page);
935                         err = copied;
936                 }
937                 unlock_page(page);
938                 put_page(page);
939         } else {
940                 err = generic_write_end(file, mapping, pos, len, copied, page,
941                                         fsdata);
942         }
943
944         if (err >= 0) {
945                 if (!(ni->std_fa & FILE_ATTRIBUTE_ARCHIVE)) {
946                         inode->i_ctime = inode->i_mtime = current_time(inode);
947                         ni->std_fa |= FILE_ATTRIBUTE_ARCHIVE;
948                         dirty = true;
949                 }
950
951                 if (valid != ni->i_valid) {
952                         /* ni->i_valid is changed in ntfs_get_block_vbo. */
953                         dirty = true;
954                 }
955
956                 if (dirty)
957                         mark_inode_dirty(inode);
958         }
959
960         return err;
961 }
962
963 int reset_log_file(struct inode *inode)
964 {
965         int err;
966         loff_t pos = 0;
967         u32 log_size = inode->i_size;
968         struct address_space *mapping = inode->i_mapping;
969
970         for (;;) {
971                 u32 len;
972                 void *kaddr;
973                 struct page *page;
974
975                 len = pos + PAGE_SIZE > log_size ? (log_size - pos) : PAGE_SIZE;
976
977                 err = block_write_begin(mapping, pos, len, &page,
978                                         ntfs_get_block_write_begin);
979                 if (err)
980                         goto out;
981
982                 kaddr = kmap_atomic(page);
983                 memset(kaddr, -1, len);
984                 kunmap_atomic(kaddr);
985                 flush_dcache_page(page);
986
987                 err = block_write_end(NULL, mapping, pos, len, len, page, NULL);
988                 if (err < 0)
989                         goto out;
990                 pos += len;
991
992                 if (pos >= log_size)
993                         break;
994                 balance_dirty_pages_ratelimited(mapping);
995         }
996 out:
997         mark_inode_dirty_sync(inode);
998
999         return err;
1000 }
1001
1002 int ntfs3_write_inode(struct inode *inode, struct writeback_control *wbc)
1003 {
1004         return _ni_write_inode(inode, wbc->sync_mode == WB_SYNC_ALL);
1005 }
1006
/*
 * ntfs_sync_inode - Write the inode via _ni_write_inode() with sync set.
 */
int ntfs_sync_inode(struct inode *inode)
{
        const int sync = 1;

        return _ni_write_inode(inode, sync);
}
1011
1012 /*
1013  * writeback_inode - Helper function for ntfs_flush_inodes().
1014  *
1015  * This writes both the inode and the file data blocks, waiting
1016  * for in flight data blocks before the start of the call.  It
1017  * does not wait for any io started during the call.
1018  */
1019 static int writeback_inode(struct inode *inode)
1020 {
1021         int ret = sync_inode_metadata(inode, 0);
1022
1023         if (!ret)
1024                 ret = filemap_fdatawrite(inode->i_mapping);
1025         return ret;
1026 }
1027
1028 /*
1029  * ntfs_flush_inodes
1030  *
1031  * Write data and metadata corresponding to i1 and i2.  The io is
1032  * started but we do not wait for any of it to finish.
1033  *
1034  * filemap_flush() is used for the block device, so if there is a dirty
1035  * page for a block already in flight, we will not wait and start the
1036  * io over again.
1037  */
1038 int ntfs_flush_inodes(struct super_block *sb, struct inode *i1,
1039                       struct inode *i2)
1040 {
1041         int ret = 0;
1042
1043         if (i1)
1044                 ret = writeback_inode(i1);
1045         if (!ret && i2)
1046                 ret = writeback_inode(i2);
1047         if (!ret)
1048                 ret = sync_blockdev_nowait(sb->s_bdev);
1049         return ret;
1050 }
1051
1052 int inode_write_data(struct inode *inode, const void *data, size_t bytes)
1053 {
1054         pgoff_t idx;
1055
1056         /* Write non resident data. */
1057         for (idx = 0; bytes; idx++) {
1058                 size_t op = bytes > PAGE_SIZE ? PAGE_SIZE : bytes;
1059                 struct page *page = ntfs_map_page(inode->i_mapping, idx);
1060
1061                 if (IS_ERR(page))
1062                         return PTR_ERR(page);
1063
1064                 lock_page(page);
1065                 WARN_ON(!PageUptodate(page));
1066                 ClearPageUptodate(page);
1067
1068                 memcpy(page_address(page), data, op);
1069
1070                 flush_dcache_page(page);
1071                 SetPageUptodate(page);
1072                 unlock_page(page);
1073
1074                 ntfs_unmap_page(page);
1075
1076                 bytes -= op;
1077                 data = Add2Ptr(data, PAGE_SIZE);
1078         }
1079         return 0;
1080 }
1081
1082 /*
1083  * ntfs_reparse_bytes
1084  *
1085  * Number of bytes for REPARSE_DATA_BUFFER(IO_REPARSE_TAG_SYMLINK)
1086  * for unicode string of @uni_len length.
1087  */
1088 static inline u32 ntfs_reparse_bytes(u32 uni_len)
1089 {
1090         /* Header + unicode string + decorated unicode string. */
1091         return sizeof(short) * (2 * uni_len + 4) +
1092                offsetof(struct REPARSE_DATA_BUFFER,
1093                         SymbolicLinkReparseBuffer.PathBuffer);
1094 }
1095
1096 static struct REPARSE_DATA_BUFFER *
1097 ntfs_create_reparse_buffer(struct ntfs_sb_info *sbi, const char *symname,
1098                            u32 size, u16 *nsize)
1099 {
1100         int i, err;
1101         struct REPARSE_DATA_BUFFER *rp;
1102         __le16 *rp_name;
1103         typeof(rp->SymbolicLinkReparseBuffer) *rs;
1104
1105         rp = kzalloc(ntfs_reparse_bytes(2 * size + 2), GFP_NOFS);
1106         if (!rp)
1107                 return ERR_PTR(-ENOMEM);
1108
1109         rs = &rp->SymbolicLinkReparseBuffer;
1110         rp_name = rs->PathBuffer;
1111
1112         /* Convert link name to UTF-16. */
1113         err = ntfs_nls_to_utf16(sbi, symname, size,
1114                                 (struct cpu_str *)(rp_name - 1), 2 * size,
1115                                 UTF16_LITTLE_ENDIAN);
1116         if (err < 0)
1117                 goto out;
1118
1119         /* err = the length of unicode name of symlink. */
1120         *nsize = ntfs_reparse_bytes(err);
1121
1122         if (*nsize > sbi->reparse.max_size) {
1123                 err = -EFBIG;
1124                 goto out;
1125         }
1126
1127         /* Translate Linux '/' into Windows '\'. */
1128         for (i = 0; i < err; i++) {
1129                 if (rp_name[i] == cpu_to_le16('/'))
1130                         rp_name[i] = cpu_to_le16('\\');
1131         }
1132
1133         rp->ReparseTag = IO_REPARSE_TAG_SYMLINK;
1134         rp->ReparseDataLength =
1135                 cpu_to_le16(*nsize - offsetof(struct REPARSE_DATA_BUFFER,
1136                                               SymbolicLinkReparseBuffer));
1137
1138         /* PrintName + SubstituteName. */
1139         rs->SubstituteNameOffset = cpu_to_le16(sizeof(short) * err);
1140         rs->SubstituteNameLength = cpu_to_le16(sizeof(short) * err + 8);
1141         rs->PrintNameLength = rs->SubstituteNameOffset;
1142
1143         /*
1144          * TODO: Use relative path if possible to allow Windows to
1145          * parse this path.
1146          * 0-absolute path 1- relative path (SYMLINK_FLAG_RELATIVE).
1147          */
1148         rs->Flags = 0;
1149
1150         memmove(rp_name + err + 4, rp_name, sizeof(short) * err);
1151
1152         /* Decorate SubstituteName. */
1153         rp_name += err;
1154         rp_name[0] = cpu_to_le16('\\');
1155         rp_name[1] = cpu_to_le16('?');
1156         rp_name[2] = cpu_to_le16('?');
1157         rp_name[3] = cpu_to_le16('\\');
1158
1159         return rp;
1160 out:
1161         kfree(rp);
1162         return ERR_PTR(err);
1163 }
1164
/*
 * ntfs_create_inode - Allocate a new MFT record and link it into @dir.
 *
 * @mode selects what is built: a directory, a symlink (stored as a
 * reparse point), a regular file, or any other node type. For symlinks
 * @symname/@size give the target string. @uni is handed to
 * fill_name_de() together with the dentry name.
 *
 * The function picks the NTFS file attributes from @mode and the parent,
 * allocates a free MFT record, fills ATTR_STD, ATTR_NAME, optionally
 * ATTR_SECURE, then ATTR_ROOT or ATTR_DATA (plus ATTR_REPARSE for
 * symlinks), and finally inserts the name into the parent index.
 *
 * The parent is locked with ni_lock_dir() for the duration of the record
 * construction and index insertion.
 *
 * Return: the new inode after d_instantiate() and unlock_new_inode(),
 * or ERR_PTR() after unwinding through the out7..out1 labels.
 */
1165 struct inode *ntfs_create_inode(struct user_namespace *mnt_userns,
1166                                 struct inode *dir, struct dentry *dentry,
1167                                 const struct cpu_str *uni, umode_t mode,
1168                                 dev_t dev, const char *symname, u32 size,
1169                                 struct ntfs_fnd *fnd)
1170 {
1171         int err;
1172         struct super_block *sb = dir->i_sb;
1173         struct ntfs_sb_info *sbi = sb->s_fs_info;
1174         const struct qstr *name = &dentry->d_name;
1175         CLST ino = 0;
1176         struct ntfs_inode *dir_ni = ntfs_i(dir);
1177         struct ntfs_inode *ni = NULL;
1178         struct inode *inode = NULL;
1179         struct ATTRIB *attr;
1180         struct ATTR_STD_INFO5 *std5;
1181         struct ATTR_FILE_NAME *fname;
1182         struct MFT_REC *rec;
1183         u32 asize, dsize, sd_size;
1184         enum FILE_ATTRIBUTE fa;
1185         __le32 security_id = SECURITY_ID_INVALID;
1186         CLST vcn;
1187         const void *sd;
1188         u16 t16, nsize = 0, aid = 0;
1189         struct INDEX_ROOT *root, *dir_root;
1190         struct NTFS_DE *e, *new_de = NULL;
1191         struct REPARSE_DATA_BUFFER *rp = NULL;
1192         bool rp_inserted = false;
1193
1194         ni_lock_dir(dir_ni);
1195
1196         dir_root = indx_get_root(&dir_ni->dir, dir_ni, NULL, NULL);
1197         if (!dir_root) {
1198                 err = -EINVAL;
1199                 goto out1;
1200         }
1201
1202         if (S_ISDIR(mode)) {
1203                 /* Use parent's directory attributes. */
1204                 fa = dir_ni->std_fa | FILE_ATTRIBUTE_DIRECTORY |
1205                      FILE_ATTRIBUTE_ARCHIVE;
1206                 /*
1207                  * By default child directory inherits parent attributes.
1208                  * Root directory is hidden + system.
1209                  * Make an exception for children in root.
1210                  */
1211                 if (dir->i_ino == MFT_REC_ROOT)
1212                         fa &= ~(FILE_ATTRIBUTE_HIDDEN | FILE_ATTRIBUTE_SYSTEM);
1213         } else if (S_ISLNK(mode)) {
1214                 /* It is a good idea for the link to be the same type (file/dir) as its target. */
1215                 fa = FILE_ATTRIBUTE_REPARSE_POINT;
1216
1217                 /*
1218                  * Linux: there are dir/file/symlink and so on.
1219                  * NTFS: symlinks are "dir + reparse" or "file + reparse"
1220                  * It would be good to create:
1221                  * dir + reparse if 'symname' points to directory
1222                  * or
1223                  * file + reparse if 'symname' points to file
1224                  * Unfortunately kern_path hangs if symname contains 'dir'.
1225                  */
1226
1227                 /*
1228                  *      struct path path;
1229                  *
1230                  *      if (!kern_path(symname, LOOKUP_FOLLOW, &path)){
1231                  *              struct inode *target = d_inode(path.dentry);
1232                  *
1233                  *              if (S_ISDIR(target->i_mode))
1234                  *                      fa |= FILE_ATTRIBUTE_DIRECTORY;
1235                  *              // if ( target->i_sb == sb ){
1236                  *              //      use relative path?
1237                  *              // }
1238                  *              path_put(&path);
1239                  *      }
1240                  */
1241         } else if (S_ISREG(mode)) {
1242                 if (sbi->options->sparse) {
1243                         /* Sparse regular file, because of mount option 'sparse'. */
1244                         fa = FILE_ATTRIBUTE_SPARSE_FILE |
1245                              FILE_ATTRIBUTE_ARCHIVE;
1246                 } else if (dir_ni->std_fa & FILE_ATTRIBUTE_COMPRESSED) {
1247                         /* Compressed regular file, if parent is compressed. */
1248                         fa = FILE_ATTRIBUTE_COMPRESSED | FILE_ATTRIBUTE_ARCHIVE;
1249                 } else {
1250                         /* Regular file, default attributes. */
1251                         fa = FILE_ATTRIBUTE_ARCHIVE;
1252                 }
1253         } else {
1254                 fa = FILE_ATTRIBUTE_ARCHIVE;
1255         }
1256
             /* No write permission bit at all maps to the READONLY attribute. */
1257         if (!(mode & 0222))
1258                 fa |= FILE_ATTRIBUTE_READONLY;
1259
1260         /* Allocate PATH_MAX bytes. */
1261         new_de = __getname();
1262         if (!new_de) {
1263                 err = -ENOMEM;
1264                 goto out1;
1265         }
1266
1267         /* Mark rw ntfs as dirty. It will be cleared at umount. */
1268         ntfs_set_state(sbi, NTFS_DIRTY_DIRTY);
1269
1270         /* Step 1: allocate and fill new mft record. */
1271         err = ntfs_look_free_mft(sbi, &ino, false, NULL, NULL);
1272         if (err)
1273                 goto out2;
1274
1275         ni = ntfs_new_inode(sbi, ino, fa & FILE_ATTRIBUTE_DIRECTORY);
1276         if (IS_ERR(ni)) {
1277                 err = PTR_ERR(ni);
1278                 ni = NULL;
1279                 goto out3;
1280         }
1281         inode = &ni->vfs_inode;
1282         inode_init_owner(mnt_userns, inode, dir, mode);
             /* inode_init_owner() may have adjusted the mode; use its result from here on. */
1283         mode = inode->i_mode;
1284
1285         inode->i_atime = inode->i_mtime = inode->i_ctime = ni->i_crtime =
1286                 current_time(inode);
1287
1288         rec = ni->mi.mrec;
1289         rec->hard_links = cpu_to_le16(1);
             /* 'attr' walks forward through the record as attributes are appended. */
1290         attr = Add2Ptr(rec, le16_to_cpu(rec->attr_off));
1291
1292         /* Get default security id. */
1293         sd = s_default_security;
1294         sd_size = sizeof(s_default_security);
1295
1296         if (is_ntfs3(sbi)) {
1297                 security_id = dir_ni->std_security_id;
1298                 if (le32_to_cpu(security_id) < SECURITY_ID_FIRST) {
1299                         security_id = sbi->security.def_security_id;
1300
1301                         if (security_id == SECURITY_ID_INVALID &&
1302                             !ntfs_insert_security(sbi, sd, sd_size,
1303                                                   &security_id, NULL))
1304                                 sbi->security.def_security_id = security_id;
1305                 }
1306         }
1307
1308         /* Insert standard info. */
1309         std5 = Add2Ptr(attr, SIZEOF_RESIDENT);
1310
1311         if (security_id == SECURITY_ID_INVALID) {
1312                 dsize = sizeof(struct ATTR_STD_INFO);
1313         } else {
1314                 dsize = sizeof(struct ATTR_STD_INFO5);
1315                 std5->security_id = security_id;
1316                 ni->std_security_id = security_id;
1317         }
1318         asize = SIZEOF_RESIDENT + dsize;
1319
1320         attr->type = ATTR_STD;
1321         attr->size = cpu_to_le32(asize);
1322         attr->id = cpu_to_le16(aid++);
1323         attr->res.data_off = SIZEOF_RESIDENT_LE;
1324         attr->res.data_size = cpu_to_le32(dsize);
1325
1326         std5->cr_time = std5->m_time = std5->c_time = std5->a_time =
1327                 kernel2nt(&inode->i_atime);
1328
1329         ni->std_fa = fa;
1330         std5->fa = fa;
1331
1332         attr = Add2Ptr(attr, asize);
1333
1334         /* Insert file name. */
1335         err = fill_name_de(sbi, new_de, name, uni);
1336         if (err)
1337                 goto out4;
1338
1339         mi_get_ref(&ni->mi, &new_de->ref);
1340
             /* The file name key is stored right behind the directory entry header. */
1341         fname = (struct ATTR_FILE_NAME *)(new_de + 1);
1342         mi_get_ref(&dir_ni->mi, &fname->home);
1343         fname->dup.cr_time = fname->dup.m_time = fname->dup.c_time =
1344                 fname->dup.a_time = std5->cr_time;
1345         fname->dup.alloc_size = fname->dup.data_size = 0;
1346         fname->dup.fa = std5->fa;
1347         fname->dup.ea_size = fname->dup.reparse = 0;
1348
1349         dsize = le16_to_cpu(new_de->key_size);
1350         asize = ALIGN(SIZEOF_RESIDENT + dsize, 8);
1351
1352         attr->type = ATTR_NAME;
1353         attr->size = cpu_to_le32(asize);
1354         attr->res.data_off = SIZEOF_RESIDENT_LE;
1355         attr->res.flags = RESIDENT_FLAG_INDEXED;
1356         attr->id = cpu_to_le16(aid++);
1357         attr->res.data_size = cpu_to_le32(dsize);
1358         memcpy(Add2Ptr(attr, SIZEOF_RESIDENT), fname, dsize);
1359
1360         attr = Add2Ptr(attr, asize);
1361
1362         if (security_id == SECURITY_ID_INVALID) {
1363                 /* Insert security attribute. */
1364                 asize = SIZEOF_RESIDENT + ALIGN(sd_size, 8);
1365
1366                 attr->type = ATTR_SECURE;
1367                 attr->size = cpu_to_le32(asize);
1368                 attr->id = cpu_to_le16(aid++);
1369                 attr->res.data_off = SIZEOF_RESIDENT_LE;
1370                 attr->res.data_size = cpu_to_le32(sd_size);
1371                 memcpy(Add2Ptr(attr, SIZEOF_RESIDENT), sd, sd_size);
1372
1373                 attr = Add2Ptr(attr, asize);
1374         }
1375
             /* Next attribute is ATTR_ROOT or ATTR_DATA, depending on the type. */
1376         attr->id = cpu_to_le16(aid++);
1377         if (fa & FILE_ATTRIBUTE_DIRECTORY) {
1378                 /*
1379                  * Regular directory or symlink to directory.
1380                  * Create root attribute.
1381                  */
1382                 dsize = sizeof(struct INDEX_ROOT) + sizeof(struct NTFS_DE);
1383                 asize = sizeof(I30_NAME) + SIZEOF_RESIDENT + dsize;
1384
1385                 attr->type = ATTR_ROOT;
1386                 attr->size = cpu_to_le32(asize);
1387
1388                 attr->name_len = ARRAY_SIZE(I30_NAME);
1389                 attr->name_off = SIZEOF_RESIDENT_LE;
1390                 attr->res.data_off =
1391                         cpu_to_le16(sizeof(I30_NAME) + SIZEOF_RESIDENT);
1392                 attr->res.data_size = cpu_to_le32(dsize);
1393                 memcpy(Add2Ptr(attr, SIZEOF_RESIDENT), I30_NAME,
1394                        sizeof(I30_NAME));
1395
1396                 root = Add2Ptr(attr, sizeof(I30_NAME) + SIZEOF_RESIDENT);
                     /* Copy the part of the parent's index root that precedes 'ihdr'. */
1397                 memcpy(root, dir_root, offsetof(struct INDEX_ROOT, ihdr));
1398                 root->ihdr.de_off =
1399                         cpu_to_le32(sizeof(struct INDEX_HDR)); // 0x10
1400                 root->ihdr.used = cpu_to_le32(sizeof(struct INDEX_HDR) +
1401                                               sizeof(struct NTFS_DE));
1402                 root->ihdr.total = root->ihdr.used;
1403
                     /* The only entry of the new index is the terminating one. */
1404                 e = Add2Ptr(root, sizeof(struct INDEX_ROOT));
1405                 e->size = cpu_to_le16(sizeof(struct NTFS_DE));
1406                 e->flags = NTFS_IE_LAST;
1407         } else if (S_ISLNK(mode)) {
1408                 /*
1409                  * Symlink to file.
1410                  * Create empty resident data attribute.
1411                  */
1412                 asize = SIZEOF_RESIDENT;
1413
1414                 /* Insert empty ATTR_DATA */
1415                 attr->type = ATTR_DATA;
1416                 attr->size = cpu_to_le32(SIZEOF_RESIDENT);
1417                 attr->name_off = SIZEOF_RESIDENT_LE;
1418                 attr->res.data_off = SIZEOF_RESIDENT_LE;
1419         } else if (S_ISREG(mode)) {
1420                 /*
1421                  * Regular file. Create empty non resident data attribute.
1422                  */
1423                 attr->type = ATTR_DATA;
1424                 attr->non_res = 1;
1425                 attr->nres.evcn = cpu_to_le64(-1ll);
1426                 if (fa & FILE_ATTRIBUTE_SPARSE_FILE) {
1427                         attr->size = cpu_to_le32(SIZEOF_NONRESIDENT_EX + 8);
1428                         attr->name_off = SIZEOF_NONRESIDENT_EX_LE;
1429                         attr->flags = ATTR_FLAG_SPARSED;
1430                         asize = SIZEOF_NONRESIDENT_EX + 8;
1431                 } else if (fa & FILE_ATTRIBUTE_COMPRESSED) {
1432                         attr->size = cpu_to_le32(SIZEOF_NONRESIDENT_EX + 8);
1433                         attr->name_off = SIZEOF_NONRESIDENT_EX_LE;
1434                         attr->flags = ATTR_FLAG_COMPRESSED;
1435                         attr->nres.c_unit = COMPRESSION_UNIT;
1436                         asize = SIZEOF_NONRESIDENT_EX + 8;
1437                 } else {
1438                         attr->size = cpu_to_le32(SIZEOF_NONRESIDENT + 8);
1439                         attr->name_off = SIZEOF_NONRESIDENT_LE;
1440                         asize = SIZEOF_NONRESIDENT + 8;
1441                 }
1442                 attr->nres.run_off = attr->name_off;
1443         } else {
1444                 /*
1445                  * Node. Create empty resident data attribute.
1446                  */
1447                 attr->type = ATTR_DATA;
1448                 attr->size = cpu_to_le32(SIZEOF_RESIDENT);
1449                 attr->name_off = SIZEOF_RESIDENT_LE;
1450                 if (fa & FILE_ATTRIBUTE_SPARSE_FILE)
1451                         attr->flags = ATTR_FLAG_SPARSED;
1452                 else if (fa & FILE_ATTRIBUTE_COMPRESSED)
1453                         attr->flags = ATTR_FLAG_COMPRESSED;
1454                 attr->res.data_off = SIZEOF_RESIDENT_LE;
1455                 asize = SIZEOF_RESIDENT;
1456                 ni->ni_flags |= NI_FLAG_RESIDENT;
1457         }
1458
1459         if (S_ISDIR(mode)) {
1460                 ni->ni_flags |= NI_FLAG_DIR;
1461                 err = indx_init(&ni->dir, sbi, attr, INDEX_MUTEX_I30);
1462                 if (err)
1463                         goto out4;
1464         } else if (S_ISLNK(mode)) {
1465                 rp = ntfs_create_reparse_buffer(sbi, symname, size, &nsize);
1466
1467                 if (IS_ERR(rp)) {
1468                         err = PTR_ERR(rp);
1469                         rp = NULL;
1470                         goto out4;
1471                 }
1472
1473                 /*
1474                  * Insert ATTR_REPARSE.
1475                  */
1476                 attr = Add2Ptr(attr, asize);
1477                 attr->type = ATTR_REPARSE;
1478                 attr->id = cpu_to_le16(aid++);
1479
1480                 /* Resident or non resident? */
1481                 asize = ALIGN(SIZEOF_RESIDENT + nsize, 8);
1482                 t16 = PtrOffset(rec, attr);
1483
1484                 /*
1485                  * Below function 'ntfs_save_wsl_perm' requires 0x78 bytes.
1486                  * It is a good idea to keep extended attributes resident.
1487                  */
1488                 if (asize + t16 + 0x78 + 8 > sbi->record_size) {
1489                         CLST alen;
1490                         CLST clst = bytes_to_cluster(sbi, nsize);
1491
1492                         /* Bytes per runs. */
1493                         t16 = sbi->record_size - t16 - SIZEOF_NONRESIDENT;
1494
1495                         attr->non_res = 1;
1496                         attr->nres.evcn = cpu_to_le64(clst - 1);
1497                         attr->name_off = SIZEOF_NONRESIDENT_LE;
1498                         attr->nres.run_off = attr->name_off;
1499                         attr->nres.data_size = cpu_to_le64(nsize);
1500                         attr->nres.valid_size = attr->nres.data_size;
1501                         attr->nres.alloc_size =
1502                                 cpu_to_le64(ntfs_up_cluster(sbi, nsize));
1503
1504                         err = attr_allocate_clusters(sbi, &ni->file.run, 0, 0,
1505                                                      clst, NULL, 0, &alen, 0,
1506                                                      NULL);
1507                         if (err)
1508                                 goto out5;
1509
1510                         err = run_pack(&ni->file.run, 0, clst,
1511                                        Add2Ptr(attr, SIZEOF_NONRESIDENT), t16,
1512                                        &vcn);
1513                         if (err < 0)
1514                                 goto out5;
1515
1516                         if (vcn != clst) {
1517                                 err = -EINVAL;
1518                                 goto out5;
1519                         }
1520
                             /* A non-negative 'err' from run_pack() is used as the packed size. */
1521                         asize = SIZEOF_NONRESIDENT + ALIGN(err, 8);
1522                 } else {
1523                         attr->res.data_off = SIZEOF_RESIDENT_LE;
1524                         attr->res.data_size = cpu_to_le32(nsize);
1525                         memcpy(Add2Ptr(attr, SIZEOF_RESIDENT), rp, nsize);
                             /* Zero 'nsize' so the non resident write below is skipped. */
1526                         nsize = 0;
1527                 }
1528                 /* Size of symlink equals the length of input string. */
1529                 inode->i_size = size;
1530
1531                 attr->size = cpu_to_le32(asize);
1532
1533                 err = ntfs_insert_reparse(sbi, IO_REPARSE_TAG_SYMLINK,
1534                                           &new_de->ref);
1535                 if (err)
1536                         goto out5;
1537
1538                 rp_inserted = true;
1539         }
1540
             /* Terminate the attribute list and record how much of the record is used. */
1541         attr = Add2Ptr(attr, asize);
1542         attr->type = ATTR_END;
1543
1544         rec->used = cpu_to_le32(PtrOffset(rec, attr) + 8);
1545         rec->next_attr_id = cpu_to_le16(aid);
1546
1547         /* Step 2: Add new name in index. */
1548         err = indx_insert_entry(&dir_ni->dir, dir_ni, new_de, sbi, fnd, 0);
1549         if (err)
1550                 goto out6;
1551
1552         /* Unlock parent directory before ntfs_init_acl. */
1553         ni_unlock(dir_ni);
1554
1555         inode->i_generation = le16_to_cpu(rec->seq);
1556
1557         dir->i_mtime = dir->i_ctime = inode->i_atime;
1558
1559         if (S_ISDIR(mode)) {
1560                 inode->i_op = &ntfs_dir_inode_operations;
1561                 inode->i_fop = &ntfs_dir_operations;
1562         } else if (S_ISLNK(mode)) {
1563                 inode->i_op = &ntfs_link_inode_operations;
1564                 inode->i_fop = NULL;
1565                 inode->i_mapping->a_ops = &ntfs_aops;
1566                 inode->i_size = size;
1567                 inode_nohighmem(inode);
1568         } else if (S_ISREG(mode)) {
1569                 inode->i_op = &ntfs_file_inode_operations;
1570                 inode->i_fop = &ntfs_file_operations;
1571                 inode->i_mapping->a_ops =
1572                         is_compressed(ni) ? &ntfs_aops_cmpr : &ntfs_aops;
1573                 init_rwsem(&ni->file.run_lock);
1574         } else {
1575                 inode->i_op = &ntfs_special_inode_operations;
1576                 init_special_inode(inode, mode, dev);
1577         }
1578
1579 #ifdef CONFIG_NTFS3_FS_POSIX_ACL
1580         if (!S_ISLNK(mode) && (sb->s_flags & SB_POSIXACL)) {
1581                 err = ntfs_init_acl(mnt_userns, inode, dir);
1582                 if (err)
1583                         goto out7;
1584         } else
1585 #endif
1586         {
1587                 inode->i_flags |= S_NOSEC;
1588         }
1589
1590         /* Write non resident data. */
1591         if (nsize) {
1592                 err = ntfs_sb_write_run(sbi, &ni->file.run, 0, rp, nsize, 0);
1593                 if (err)
1594                         goto out7;
1595         }
1596
1597         /*
1598          * Call 'd_instantiate' after inode->i_op is set
1599          * but before finish_open.
1600          */
1601         d_instantiate(dentry, inode);
1602
1603         ntfs_save_wsl_perm(inode);
1604         mark_inode_dirty(dir);
1605         mark_inode_dirty(inode);
1606
1607         /* Normal exit. */
1608         goto out2;
1609
             /*
              * Error unwinding: each label below undoes one more step and
              * falls through to the next one.
              */
1610 out7:
1611
1612         /* Undo 'indx_insert_entry'. */
1613         ni_lock_dir(dir_ni);
1614         indx_delete_entry(&dir_ni->dir, dir_ni, new_de + 1,
1615                           le16_to_cpu(new_de->key_size), sbi);
1616         /* ni_unlock(dir_ni); will be called later. */
1617 out6:
1618         if (rp_inserted)
1619                 ntfs_remove_reparse(sbi, IO_REPARSE_TAG_SYMLINK, &new_de->ref);
1620
1621 out5:
             /* Free clusters allocated above, if any. */
1622         if (S_ISDIR(mode) || run_is_empty(&ni->file.run))
1623                 goto out4;
1624
1625         run_deallocate(sbi, &ni->file.run, false);
1626
1627 out4:
1628         clear_rec_inuse(rec);
1629         clear_nlink(inode);
1630         ni->mi.dirty = false;
1631         discard_new_inode(inode);
1632 out3:
1633         ntfs_mark_rec_free(sbi, ino);
1634
1635 out2:
             /* Shared by the normal exit and the error paths. */
1636         __putname(new_de);
1637         kfree(rp);
1638
1639 out1:
1640         if (err) {
                     /* On every error path the parent is still (or again) locked here. */
1641                 ni_unlock(dir_ni);
1642                 return ERR_PTR(err);
1643         }
1644
1645         unlock_new_inode(inode);
1646
1647         return inode;
1648 }
1649
1650 int ntfs_link_inode(struct inode *inode, struct dentry *dentry)
1651 {
1652         int err;
1653         struct ntfs_inode *ni = ntfs_i(inode);
1654         struct ntfs_sb_info *sbi = inode->i_sb->s_fs_info;
1655         struct NTFS_DE *de;
1656         struct ATTR_FILE_NAME *de_name;
1657
1658         /* Allocate PATH_MAX bytes. */
1659         de = __getname();
1660         if (!de)
1661                 return -ENOMEM;
1662
1663         /* Mark rw ntfs as dirty. It will be cleared at umount. */
1664         ntfs_set_state(sbi, NTFS_DIRTY_DIRTY);
1665
1666         /* Construct 'de'. */
1667         err = fill_name_de(sbi, de, &dentry->d_name, NULL);
1668         if (err)
1669                 goto out;
1670
1671         de_name = (struct ATTR_FILE_NAME *)(de + 1);
1672         /* Fill duplicate info. */
1673         de_name->dup.cr_time = de_name->dup.m_time = de_name->dup.c_time =
1674                 de_name->dup.a_time = kernel2nt(&inode->i_ctime);
1675         de_name->dup.alloc_size = de_name->dup.data_size =
1676                 cpu_to_le64(inode->i_size);
1677         de_name->dup.fa = ni->std_fa;
1678         de_name->dup.ea_size = de_name->dup.reparse = 0;
1679
1680         err = ni_add_name(ntfs_i(d_inode(dentry->d_parent)), ni, de);
1681 out:
1682         __putname(de);
1683         return err;
1684 }
1685
1686 /*
1687  * ntfs_unlink_inode
1688  *
1689  * inode_operations::unlink
1690  * inode_operations::rmdir
1691  */
1692 int ntfs_unlink_inode(struct inode *dir, const struct dentry *dentry)
1693 {
1694         int err;
1695         struct ntfs_sb_info *sbi = dir->i_sb->s_fs_info;
1696         struct inode *inode = d_inode(dentry);
1697         struct ntfs_inode *ni = ntfs_i(inode);
1698         struct ntfs_inode *dir_ni = ntfs_i(dir);
1699         struct NTFS_DE *de, *de2 = NULL;
1700         int undo_remove;
1701
1702         if (ntfs_is_meta_file(sbi, ni->mi.rno))
1703                 return -EINVAL;
1704
1705         /* Allocate PATH_MAX bytes. */
1706         de = __getname();
1707         if (!de)
1708                 return -ENOMEM;
1709
1710         ni_lock(ni);
1711
1712         if (S_ISDIR(inode->i_mode) && !dir_is_empty(inode)) {
1713                 err = -ENOTEMPTY;
1714                 goto out;
1715         }
1716
1717         err = fill_name_de(sbi, de, &dentry->d_name, NULL);
1718         if (err < 0)
1719                 goto out;
1720
1721         undo_remove = 0;
1722         err = ni_remove_name(dir_ni, ni, de, &de2, &undo_remove);
1723
1724         if (!err) {
1725                 drop_nlink(inode);
1726                 dir->i_mtime = dir->i_ctime = current_time(dir);
1727                 mark_inode_dirty(dir);
1728                 inode->i_ctime = dir->i_ctime;
1729                 if (inode->i_nlink)
1730                         mark_inode_dirty(inode);
1731         } else if (!ni_remove_name_undo(dir_ni, ni, de, de2, undo_remove)) {
1732                 make_bad_inode(inode);
1733                 ntfs_inode_err(inode, "failed to undo unlink");
1734                 ntfs_set_state(sbi, NTFS_DIRTY_ERROR);
1735         } else {
1736                 if (ni_is_dirty(dir))
1737                         mark_inode_dirty(dir);
1738                 if (ni_is_dirty(inode))
1739                         mark_inode_dirty(inode);
1740         }
1741
1742 out:
1743         ni_unlock(ni);
1744         __putname(de);
1745         return err;
1746 }
1747
1748 void ntfs_evict_inode(struct inode *inode)
1749 {
1750         truncate_inode_pages_final(&inode->i_data);
1751
1752         if (inode->i_nlink)
1753                 _ni_write_inode(inode, inode_needs_sync(inode));
1754
1755         invalidate_inode_buffers(inode);
1756         clear_inode(inode);
1757
1758         ni_clear(ntfs_i(inode));
1759 }
1760
1761 static noinline int ntfs_readlink_hlp(struct inode *inode, char *buffer,
1762                                       int buflen)
1763 {
1764         int i, err = -EINVAL;
1765         struct ntfs_inode *ni = ntfs_i(inode);
1766         struct super_block *sb = inode->i_sb;
1767         struct ntfs_sb_info *sbi = sb->s_fs_info;
1768         u64 size;
1769         u16 ulen = 0;
1770         void *to_free = NULL;
1771         struct REPARSE_DATA_BUFFER *rp;
1772         const __le16 *uname;
1773         struct ATTRIB *attr;
1774
1775         /* Reparse data present. Try to parse it. */
1776         static_assert(!offsetof(struct REPARSE_DATA_BUFFER, ReparseTag));
1777         static_assert(sizeof(u32) == sizeof(rp->ReparseTag));
1778
1779         *buffer = 0;
1780
1781         attr = ni_find_attr(ni, NULL, NULL, ATTR_REPARSE, NULL, 0, NULL, NULL);
1782         if (!attr)
1783                 goto out;
1784
1785         if (!attr->non_res) {
1786                 rp = resident_data_ex(attr, sizeof(struct REPARSE_DATA_BUFFER));
1787                 if (!rp)
1788                         goto out;
1789                 size = le32_to_cpu(attr->res.data_size);
1790         } else {
1791                 size = le64_to_cpu(attr->nres.data_size);
1792                 rp = NULL;
1793         }
1794
1795         if (size > sbi->reparse.max_size || size <= sizeof(u32))
1796                 goto out;
1797
1798         if (!rp) {
1799                 rp = kmalloc(size, GFP_NOFS);
1800                 if (!rp) {
1801                         err = -ENOMEM;
1802                         goto out;
1803                 }
1804                 to_free = rp;
1805                 /* Read into temporal buffer. */
1806                 err = ntfs_read_run_nb(sbi, &ni->file.run, 0, rp, size, NULL);
1807                 if (err)
1808                         goto out;
1809         }
1810
1811         /* Microsoft Tag. */
1812         switch (rp->ReparseTag) {
1813         case IO_REPARSE_TAG_MOUNT_POINT:
1814                 /* Mount points and junctions. */
1815                 /* Can we use 'Rp->MountPointReparseBuffer.PrintNameLength'? */
1816                 if (size <= offsetof(struct REPARSE_DATA_BUFFER,
1817                                      MountPointReparseBuffer.PathBuffer))
1818                         goto out;
1819                 uname = Add2Ptr(rp,
1820                                 offsetof(struct REPARSE_DATA_BUFFER,
1821                                          MountPointReparseBuffer.PathBuffer) +
1822                                         le16_to_cpu(rp->MountPointReparseBuffer
1823                                                             .PrintNameOffset));
1824                 ulen = le16_to_cpu(rp->MountPointReparseBuffer.PrintNameLength);
1825                 break;
1826
1827         case IO_REPARSE_TAG_SYMLINK:
1828                 /* FolderSymbolicLink */
1829                 /* Can we use 'Rp->SymbolicLinkReparseBuffer.PrintNameLength'? */
1830                 if (size <= offsetof(struct REPARSE_DATA_BUFFER,
1831                                      SymbolicLinkReparseBuffer.PathBuffer))
1832                         goto out;
1833                 uname = Add2Ptr(
1834                         rp, offsetof(struct REPARSE_DATA_BUFFER,
1835                                      SymbolicLinkReparseBuffer.PathBuffer) +
1836                                     le16_to_cpu(rp->SymbolicLinkReparseBuffer
1837                                                         .PrintNameOffset));
1838                 ulen = le16_to_cpu(
1839                         rp->SymbolicLinkReparseBuffer.PrintNameLength);
1840                 break;
1841
1842         case IO_REPARSE_TAG_CLOUD:
1843         case IO_REPARSE_TAG_CLOUD_1:
1844         case IO_REPARSE_TAG_CLOUD_2:
1845         case IO_REPARSE_TAG_CLOUD_3:
1846         case IO_REPARSE_TAG_CLOUD_4:
1847         case IO_REPARSE_TAG_CLOUD_5:
1848         case IO_REPARSE_TAG_CLOUD_6:
1849         case IO_REPARSE_TAG_CLOUD_7:
1850         case IO_REPARSE_TAG_CLOUD_8:
1851         case IO_REPARSE_TAG_CLOUD_9:
1852         case IO_REPARSE_TAG_CLOUD_A:
1853         case IO_REPARSE_TAG_CLOUD_B:
1854         case IO_REPARSE_TAG_CLOUD_C:
1855         case IO_REPARSE_TAG_CLOUD_D:
1856         case IO_REPARSE_TAG_CLOUD_E:
1857         case IO_REPARSE_TAG_CLOUD_F:
1858                 err = sizeof("OneDrive") - 1;
1859                 if (err > buflen)
1860                         err = buflen;
1861                 memcpy(buffer, "OneDrive", err);
1862                 goto out;
1863
1864         default:
1865                 if (IsReparseTagMicrosoft(rp->ReparseTag)) {
1866                         /* Unknown Microsoft Tag. */
1867                         goto out;
1868                 }
1869                 if (!IsReparseTagNameSurrogate(rp->ReparseTag) ||
1870                     size <= sizeof(struct REPARSE_POINT)) {
1871                         goto out;
1872                 }
1873
1874                 /* Users tag. */
1875                 uname = Add2Ptr(rp, sizeof(struct REPARSE_POINT));
1876                 ulen = le16_to_cpu(rp->ReparseDataLength) -
1877                        sizeof(struct REPARSE_POINT);
1878         }
1879
1880         /* Convert nlen from bytes to UNICODE chars. */
1881         ulen >>= 1;
1882
1883         /* Check that name is available. */
1884         if (!ulen || uname + ulen > (__le16 *)Add2Ptr(rp, size))
1885                 goto out;
1886
1887         /* If name is already zero terminated then truncate it now. */
1888         if (!uname[ulen - 1])
1889                 ulen -= 1;
1890
1891         err = ntfs_utf16_to_nls(sbi, uname, ulen, buffer, buflen);
1892
1893         if (err < 0)
1894                 goto out;
1895
1896         /* Translate Windows '\' into Linux '/'. */
1897         for (i = 0; i < err; i++) {
1898                 if (buffer[i] == '\\')
1899                         buffer[i] = '/';
1900         }
1901
1902         /* Always set last zero. */
1903         buffer[err] = 0;
1904 out:
1905         kfree(to_free);
1906         return err;
1907 }
1908
1909 static const char *ntfs_get_link(struct dentry *de, struct inode *inode,
1910                                  struct delayed_call *done)
1911 {
1912         int err;
1913         char *ret;
1914
1915         if (!de)
1916                 return ERR_PTR(-ECHILD);
1917
1918         ret = kmalloc(PAGE_SIZE, GFP_NOFS);
1919         if (!ret)
1920                 return ERR_PTR(-ENOMEM);
1921
1922         err = ntfs_readlink_hlp(inode, ret, PAGE_SIZE);
1923         if (err < 0) {
1924                 kfree(ret);
1925                 return ERR_PTR(err);
1926         }
1927
1928         set_delayed_call(done, kfree_link, ret);
1929
1930         return ret;
1931 }
1932
1933 // clang-format off
1934 const struct inode_operations ntfs_link_inode_operations = {
1935         .get_link       = ntfs_get_link,
1936         .setattr        = ntfs3_setattr,
1937         .listxattr      = ntfs_listxattr,
1938         .permission     = ntfs_permission,
1939         .get_acl        = ntfs_get_acl,
1940         .set_acl        = ntfs_set_acl,
1941 };
1942
1943 const struct address_space_operations ntfs_aops = {
1944         .read_folio     = ntfs_read_folio,
1945         .readahead      = ntfs_readahead,
1946         .writepage      = ntfs_writepage,
1947         .writepages     = ntfs_writepages,
1948         .write_begin    = ntfs_write_begin,
1949         .write_end      = ntfs_write_end,
1950         .direct_IO      = ntfs_direct_IO,
1951         .bmap           = ntfs_bmap,
1952         .dirty_folio    = block_dirty_folio,
1953 };
1954
1955 const struct address_space_operations ntfs_aops_cmpr = {
1956         .read_folio     = ntfs_read_folio,
1957         .readahead      = ntfs_readahead,
1958 };
1959 // clang-format on