linux/fs/nilfs2/sufile.c
<<
>>
Prefs
   1/*
   2 * sufile.c - NILFS segment usage file.
   3 *
   4 * Copyright (C) 2006-2008 Nippon Telegraph and Telephone Corporation.
   5 *
   6 * This program is free software; you can redistribute it and/or modify
   7 * it under the terms of the GNU General Public License as published by
   8 * the Free Software Foundation; either version 2 of the License, or
   9 * (at your option) any later version.
  10 *
  11 * This program is distributed in the hope that it will be useful,
  12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14 * GNU General Public License for more details.
  15 *
  16 * You should have received a copy of the GNU General Public License
  17 * along with this program; if not, write to the Free Software
  18 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
  19 *
  20 * Written by Koji Sato <koji@osrg.net>.
  21 * Revised by Ryusuke Konishi <ryusuke@osrg.net>.
  22 */
  23
  24#include <linux/kernel.h>
  25#include <linux/fs.h>
  26#include <linux/string.h>
  27#include <linux/buffer_head.h>
  28#include <linux/errno.h>
  29#include <linux/nilfs2_fs.h>
  30#include "mdt.h"
  31#include "sufile.h"
  32
  33/**
  34 * struct nilfs_sufile_info - on-memory private data of sufile
  35 * @mi: on-memory private data of metadata file
  36 * @ncleansegs: number of clean segments
  37 * @allocmin: lower limit of allocatable segment range
  38 * @allocmax: upper limit of allocatable segment range
  39 */
  40struct nilfs_sufile_info {
  41        struct nilfs_mdt_info mi;
  42        unsigned long ncleansegs;/* number of clean segments */
  43        __u64 allocmin;         /* lower limit of allocatable segment range */
  44        __u64 allocmax;         /* upper limit of allocatable segment range */
  45};
  46
  47static inline struct nilfs_sufile_info *NILFS_SUI(struct inode *sufile)
  48{
  49        return (struct nilfs_sufile_info *)NILFS_MDT(sufile);
  50}
  51
  52static inline unsigned long
  53nilfs_sufile_segment_usages_per_block(const struct inode *sufile)
  54{
  55        return NILFS_MDT(sufile)->mi_entries_per_block;
  56}
  57
  58static unsigned long
  59nilfs_sufile_get_blkoff(const struct inode *sufile, __u64 segnum)
  60{
  61        __u64 t = segnum + NILFS_MDT(sufile)->mi_first_entry_offset;
  62        do_div(t, nilfs_sufile_segment_usages_per_block(sufile));
  63        return (unsigned long)t;
  64}
  65
  66static unsigned long
  67nilfs_sufile_get_offset(const struct inode *sufile, __u64 segnum)
  68{
  69        __u64 t = segnum + NILFS_MDT(sufile)->mi_first_entry_offset;
  70        return do_div(t, nilfs_sufile_segment_usages_per_block(sufile));
  71}
  72
  73static unsigned long
  74nilfs_sufile_segment_usages_in_block(const struct inode *sufile, __u64 curr,
  75                                     __u64 max)
  76{
  77        return min_t(unsigned long,
  78                     nilfs_sufile_segment_usages_per_block(sufile) -
  79                     nilfs_sufile_get_offset(sufile, curr),
  80                     max - curr + 1);
  81}
  82
  83static struct nilfs_segment_usage *
  84nilfs_sufile_block_get_segment_usage(const struct inode *sufile, __u64 segnum,
  85                                     struct buffer_head *bh, void *kaddr)
  86{
  87        return kaddr + bh_offset(bh) +
  88                nilfs_sufile_get_offset(sufile, segnum) *
  89                NILFS_MDT(sufile)->mi_entry_size;
  90}
  91
  92static inline int nilfs_sufile_get_header_block(struct inode *sufile,
  93                                                struct buffer_head **bhp)
  94{
  95        return nilfs_mdt_get_block(sufile, 0, 0, NULL, bhp);
  96}
  97
  98static inline int
  99nilfs_sufile_get_segment_usage_block(struct inode *sufile, __u64 segnum,
 100                                     int create, struct buffer_head **bhp)
 101{
 102        return nilfs_mdt_get_block(sufile,
 103                                   nilfs_sufile_get_blkoff(sufile, segnum),
 104                                   create, NULL, bhp);
 105}
 106
 107static int nilfs_sufile_delete_segment_usage_block(struct inode *sufile,
 108                                                   __u64 segnum)
 109{
 110        return nilfs_mdt_delete_block(sufile,
 111                                      nilfs_sufile_get_blkoff(sufile, segnum));
 112}
 113
 114static void nilfs_sufile_mod_counter(struct buffer_head *header_bh,
 115                                     u64 ncleanadd, u64 ndirtyadd)
 116{
 117        struct nilfs_sufile_header *header;
 118        void *kaddr;
 119
 120        kaddr = kmap_atomic(header_bh->b_page);
 121        header = kaddr + bh_offset(header_bh);
 122        le64_add_cpu(&header->sh_ncleansegs, ncleanadd);
 123        le64_add_cpu(&header->sh_ndirtysegs, ndirtyadd);
 124        kunmap_atomic(kaddr);
 125
 126        mark_buffer_dirty(header_bh);
 127}
 128
 129/**
 130 * nilfs_sufile_get_ncleansegs - return the number of clean segments
 131 * @sufile: inode of segment usage file
 132 */
 133unsigned long nilfs_sufile_get_ncleansegs(struct inode *sufile)
 134{
 135        return NILFS_SUI(sufile)->ncleansegs;
 136}
 137
 138/**
 139 * nilfs_sufile_updatev - modify multiple segment usages at a time
 140 * @sufile: inode of segment usage file
 141 * @segnumv: array of segment numbers
 142 * @nsegs: size of @segnumv array
 143 * @create: creation flag
 144 * @ndone: place to store number of modified segments on @segnumv
 145 * @dofunc: primitive operation for the update
 146 *
 147 * Description: nilfs_sufile_updatev() repeatedly calls @dofunc
 148 * against the given array of segments.  The @dofunc is called with
 149 * buffers of a header block and the sufile block in which the target
 150 * segment usage entry is contained.  If @ndone is given, the number
 151 * of successfully modified segments from the head is stored in the
 152 * place @ndone points to.
 153 *
 154 * Return Value: On success, zero is returned.  On error, one of the
 155 * following negative error codes is returned.
 156 *
 157 * %-EIO - I/O error.
 158 *
 159 * %-ENOMEM - Insufficient amount of memory available.
 160 *
 161 * %-ENOENT - Given segment usage is in hole block (may be returned if
 162 *            @create is zero)
 163 *
 164 * %-EINVAL - Invalid segment usage number
 165 */
 166int nilfs_sufile_updatev(struct inode *sufile, __u64 *segnumv, size_t nsegs,
 167                         int create, size_t *ndone,
 168                         void (*dofunc)(struct inode *, __u64,
 169                                        struct buffer_head *,
 170                                        struct buffer_head *))
 171{
 172        struct buffer_head *header_bh, *bh;
 173        unsigned long blkoff, prev_blkoff;
 174        __u64 *seg;
 175        size_t nerr = 0, n = 0;
 176        int ret = 0;
 177
 178        if (unlikely(nsegs == 0))
 179                goto out;
 180
 181        down_write(&NILFS_MDT(sufile)->mi_sem);
 182        for (seg = segnumv; seg < segnumv + nsegs; seg++) {
 183                if (unlikely(*seg >= nilfs_sufile_get_nsegments(sufile))) {
 184                        printk(KERN_WARNING
 185                               "%s: invalid segment number: %llu\n", __func__,
 186                               (unsigned long long)*seg);
 187                        nerr++;
 188                }
 189        }
 190        if (nerr > 0) {
 191                ret = -EINVAL;
 192                goto out_sem;
 193        }
 194
 195        ret = nilfs_sufile_get_header_block(sufile, &header_bh);
 196        if (ret < 0)
 197                goto out_sem;
 198
 199        seg = segnumv;
 200        blkoff = nilfs_sufile_get_blkoff(sufile, *seg);
 201        ret = nilfs_mdt_get_block(sufile, blkoff, create, NULL, &bh);
 202        if (ret < 0)
 203                goto out_header;
 204
 205        for (;;) {
 206                dofunc(sufile, *seg, header_bh, bh);
 207
 208                if (++seg >= segnumv + nsegs)
 209                        break;
 210                prev_blkoff = blkoff;
 211                blkoff = nilfs_sufile_get_blkoff(sufile, *seg);
 212                if (blkoff == prev_blkoff)
 213                        continue;
 214
 215                /* get different block */
 216                brelse(bh);
 217                ret = nilfs_mdt_get_block(sufile, blkoff, create, NULL, &bh);
 218                if (unlikely(ret < 0))
 219                        goto out_header;
 220        }
 221        brelse(bh);
 222
 223 out_header:
 224        n = seg - segnumv;
 225        brelse(header_bh);
 226 out_sem:
 227        up_write(&NILFS_MDT(sufile)->mi_sem);
 228 out:
 229        if (ndone)
 230                *ndone = n;
 231        return ret;
 232}
 233
 234int nilfs_sufile_update(struct inode *sufile, __u64 segnum, int create,
 235                        void (*dofunc)(struct inode *, __u64,
 236                                       struct buffer_head *,
 237                                       struct buffer_head *))
 238{
 239        struct buffer_head *header_bh, *bh;
 240        int ret;
 241
 242        if (unlikely(segnum >= nilfs_sufile_get_nsegments(sufile))) {
 243                printk(KERN_WARNING "%s: invalid segment number: %llu\n",
 244                       __func__, (unsigned long long)segnum);
 245                return -EINVAL;
 246        }
 247        down_write(&NILFS_MDT(sufile)->mi_sem);
 248
 249        ret = nilfs_sufile_get_header_block(sufile, &header_bh);
 250        if (ret < 0)
 251                goto out_sem;
 252
 253        ret = nilfs_sufile_get_segment_usage_block(sufile, segnum, create, &bh);
 254        if (!ret) {
 255                dofunc(sufile, segnum, header_bh, bh);
 256                brelse(bh);
 257        }
 258        brelse(header_bh);
 259
 260 out_sem:
 261        up_write(&NILFS_MDT(sufile)->mi_sem);
 262        return ret;
 263}
 264
 265/**
 266 * nilfs_sufile_set_alloc_range - limit range of segment to be allocated
 267 * @sufile: inode of segment usage file
 268 * @start: minimum segment number of allocatable region (inclusive)
 269 * @end: maximum segment number of allocatable region (inclusive)
 270 *
 271 * Return Value: On success, 0 is returned.  On error, one of the
 272 * following negative error codes is returned.
 273 *
 274 * %-ERANGE - invalid segment region
 275 */
 276int nilfs_sufile_set_alloc_range(struct inode *sufile, __u64 start, __u64 end)
 277{
 278        struct nilfs_sufile_info *sui = NILFS_SUI(sufile);
 279        __u64 nsegs;
 280        int ret = -ERANGE;
 281
 282        down_write(&NILFS_MDT(sufile)->mi_sem);
 283        nsegs = nilfs_sufile_get_nsegments(sufile);
 284
 285        if (start <= end && end < nsegs) {
 286                sui->allocmin = start;
 287                sui->allocmax = end;
 288                ret = 0;
 289        }
 290        up_write(&NILFS_MDT(sufile)->mi_sem);
 291        return ret;
 292}
 293
 294/**
 295 * nilfs_sufile_alloc - allocate a segment
 296 * @sufile: inode of segment usage file
 297 * @segnump: pointer to segment number
 298 *
 299 * Description: nilfs_sufile_alloc() allocates a clean segment.
 300 *
 301 * Return Value: On success, 0 is returned and the segment number of the
 302 * allocated segment is stored in the place pointed by @segnump. On error, one
 303 * of the following negative error codes is returned.
 304 *
 305 * %-EIO - I/O error.
 306 *
 307 * %-ENOMEM - Insufficient amount of memory available.
 308 *
 309 * %-ENOSPC - No clean segment left.
 310 */
 311int nilfs_sufile_alloc(struct inode *sufile, __u64 *segnump)
 312{
 313        struct buffer_head *header_bh, *su_bh;
 314        struct nilfs_sufile_header *header;
 315        struct nilfs_segment_usage *su;
 316        struct nilfs_sufile_info *sui = NILFS_SUI(sufile);
 317        size_t susz = NILFS_MDT(sufile)->mi_entry_size;
 318        __u64 segnum, maxsegnum, last_alloc;
 319        void *kaddr;
 320        unsigned long nsegments, ncleansegs, nsus, cnt;
 321        int ret, j;
 322
 323        down_write(&NILFS_MDT(sufile)->mi_sem);
 324
 325        ret = nilfs_sufile_get_header_block(sufile, &header_bh);
 326        if (ret < 0)
 327                goto out_sem;
 328        kaddr = kmap_atomic(header_bh->b_page);
 329        header = kaddr + bh_offset(header_bh);
 330        ncleansegs = le64_to_cpu(header->sh_ncleansegs);
 331        last_alloc = le64_to_cpu(header->sh_last_alloc);
 332        kunmap_atomic(kaddr);
 333
 334        nsegments = nilfs_sufile_get_nsegments(sufile);
 335        maxsegnum = sui->allocmax;
 336        segnum = last_alloc + 1;
 337        if (segnum < sui->allocmin || segnum > sui->allocmax)
 338                segnum = sui->allocmin;
 339
 340        for (cnt = 0; cnt < nsegments; cnt += nsus) {
 341                if (segnum > maxsegnum) {
 342                        if (cnt < sui->allocmax - sui->allocmin + 1) {
 343                                /*
 344                                 * wrap around in the limited region.
 345                                 * if allocation started from
 346                                 * sui->allocmin, this never happens.
 347                                 */
 348                                segnum = sui->allocmin;
 349                                maxsegnum = last_alloc;
 350                        } else if (segnum > sui->allocmin &&
 351                                   sui->allocmax + 1 < nsegments) {
 352                                segnum = sui->allocmax + 1;
 353                                maxsegnum = nsegments - 1;
 354                        } else if (sui->allocmin > 0)  {
 355                                segnum = 0;
 356                                maxsegnum = sui->allocmin - 1;
 357                        } else {
 358                                break; /* never happens */
 359                        }
 360                }
 361                ret = nilfs_sufile_get_segment_usage_block(sufile, segnum, 1,
 362                                                           &su_bh);
 363                if (ret < 0)
 364                        goto out_header;
 365                kaddr = kmap_atomic(su_bh->b_page);
 366                su = nilfs_sufile_block_get_segment_usage(
 367                        sufile, segnum, su_bh, kaddr);
 368
 369                nsus = nilfs_sufile_segment_usages_in_block(
 370                        sufile, segnum, maxsegnum);
 371                for (j = 0; j < nsus; j++, su = (void *)su + susz, segnum++) {
 372                        if (!nilfs_segment_usage_clean(su))
 373                                continue;
 374                        /* found a clean segment */
 375                        nilfs_segment_usage_set_dirty(su);
 376                        kunmap_atomic(kaddr);
 377
 378                        kaddr = kmap_atomic(header_bh->b_page);
 379                        header = kaddr + bh_offset(header_bh);
 380                        le64_add_cpu(&header->sh_ncleansegs, -1);
 381                        le64_add_cpu(&header->sh_ndirtysegs, 1);
 382                        header->sh_last_alloc = cpu_to_le64(segnum);
 383                        kunmap_atomic(kaddr);
 384
 385                        sui->ncleansegs--;
 386                        mark_buffer_dirty(header_bh);
 387                        mark_buffer_dirty(su_bh);
 388                        nilfs_mdt_mark_dirty(sufile);
 389                        brelse(su_bh);
 390                        *segnump = segnum;
 391                        goto out_header;
 392                }
 393
 394                kunmap_atomic(kaddr);
 395                brelse(su_bh);
 396        }
 397
 398        /* no segments left */
 399        ret = -ENOSPC;
 400
 401 out_header:
 402        brelse(header_bh);
 403
 404 out_sem:
 405        up_write(&NILFS_MDT(sufile)->mi_sem);
 406        return ret;
 407}
 408
 409void nilfs_sufile_do_cancel_free(struct inode *sufile, __u64 segnum,
 410                                 struct buffer_head *header_bh,
 411                                 struct buffer_head *su_bh)
 412{
 413        struct nilfs_segment_usage *su;
 414        void *kaddr;
 415
 416        kaddr = kmap_atomic(su_bh->b_page);
 417        su = nilfs_sufile_block_get_segment_usage(sufile, segnum, su_bh, kaddr);
 418        if (unlikely(!nilfs_segment_usage_clean(su))) {
 419                printk(KERN_WARNING "%s: segment %llu must be clean\n",
 420                       __func__, (unsigned long long)segnum);
 421                kunmap_atomic(kaddr);
 422                return;
 423        }
 424        nilfs_segment_usage_set_dirty(su);
 425        kunmap_atomic(kaddr);
 426
 427        nilfs_sufile_mod_counter(header_bh, -1, 1);
 428        NILFS_SUI(sufile)->ncleansegs--;
 429
 430        mark_buffer_dirty(su_bh);
 431        nilfs_mdt_mark_dirty(sufile);
 432}
 433
 434void nilfs_sufile_do_scrap(struct inode *sufile, __u64 segnum,
 435                           struct buffer_head *header_bh,
 436                           struct buffer_head *su_bh)
 437{
 438        struct nilfs_segment_usage *su;
 439        void *kaddr;
 440        int clean, dirty;
 441
 442        kaddr = kmap_atomic(su_bh->b_page);
 443        su = nilfs_sufile_block_get_segment_usage(sufile, segnum, su_bh, kaddr);
 444        if (su->su_flags == cpu_to_le32(1UL << NILFS_SEGMENT_USAGE_DIRTY) &&
 445            su->su_nblocks == cpu_to_le32(0)) {
 446                kunmap_atomic(kaddr);
 447                return;
 448        }
 449        clean = nilfs_segment_usage_clean(su);
 450        dirty = nilfs_segment_usage_dirty(su);
 451
 452        /* make the segment garbage */
 453        su->su_lastmod = cpu_to_le64(0);
 454        su->su_nblocks = cpu_to_le32(0);
 455        su->su_flags = cpu_to_le32(1UL << NILFS_SEGMENT_USAGE_DIRTY);
 456        kunmap_atomic(kaddr);
 457
 458        nilfs_sufile_mod_counter(header_bh, clean ? (u64)-1 : 0, dirty ? 0 : 1);
 459        NILFS_SUI(sufile)->ncleansegs -= clean;
 460
 461        mark_buffer_dirty(su_bh);
 462        nilfs_mdt_mark_dirty(sufile);
 463}
 464
 465void nilfs_sufile_do_free(struct inode *sufile, __u64 segnum,
 466                          struct buffer_head *header_bh,
 467                          struct buffer_head *su_bh)
 468{
 469        struct nilfs_segment_usage *su;
 470        void *kaddr;
 471        int sudirty;
 472
 473        kaddr = kmap_atomic(su_bh->b_page);
 474        su = nilfs_sufile_block_get_segment_usage(sufile, segnum, su_bh, kaddr);
 475        if (nilfs_segment_usage_clean(su)) {
 476                printk(KERN_WARNING "%s: segment %llu is already clean\n",
 477                       __func__, (unsigned long long)segnum);
 478                kunmap_atomic(kaddr);
 479                return;
 480        }
 481        WARN_ON(nilfs_segment_usage_error(su));
 482        WARN_ON(!nilfs_segment_usage_dirty(su));
 483
 484        sudirty = nilfs_segment_usage_dirty(su);
 485        nilfs_segment_usage_set_clean(su);
 486        kunmap_atomic(kaddr);
 487        mark_buffer_dirty(su_bh);
 488
 489        nilfs_sufile_mod_counter(header_bh, 1, sudirty ? (u64)-1 : 0);
 490        NILFS_SUI(sufile)->ncleansegs++;
 491
 492        nilfs_mdt_mark_dirty(sufile);
 493}
 494
 495/**
 496 * nilfs_sufile_mark_dirty - mark the buffer having a segment usage dirty
 497 * @sufile: inode of segment usage file
 498 * @segnum: segment number
 499 */
 500int nilfs_sufile_mark_dirty(struct inode *sufile, __u64 segnum)
 501{
 502        struct buffer_head *bh;
 503        int ret;
 504
 505        ret = nilfs_sufile_get_segment_usage_block(sufile, segnum, 0, &bh);
 506        if (!ret) {
 507                mark_buffer_dirty(bh);
 508                nilfs_mdt_mark_dirty(sufile);
 509                brelse(bh);
 510        }
 511        return ret;
 512}
 513
 514/**
 515 * nilfs_sufile_set_segment_usage - set usage of a segment
 516 * @sufile: inode of segment usage file
 517 * @segnum: segment number
 518 * @nblocks: number of live blocks in the segment
 519 * @modtime: modification time (option)
 520 */
 521int nilfs_sufile_set_segment_usage(struct inode *sufile, __u64 segnum,
 522                                   unsigned long nblocks, time_t modtime)
 523{
 524        struct buffer_head *bh;
 525        struct nilfs_segment_usage *su;
 526        void *kaddr;
 527        int ret;
 528
 529        down_write(&NILFS_MDT(sufile)->mi_sem);
 530        ret = nilfs_sufile_get_segment_usage_block(sufile, segnum, 0, &bh);
 531        if (ret < 0)
 532                goto out_sem;
 533
 534        kaddr = kmap_atomic(bh->b_page);
 535        su = nilfs_sufile_block_get_segment_usage(sufile, segnum, bh, kaddr);
 536        WARN_ON(nilfs_segment_usage_error(su));
 537        if (modtime)
 538                su->su_lastmod = cpu_to_le64(modtime);
 539        su->su_nblocks = cpu_to_le32(nblocks);
 540        kunmap_atomic(kaddr);
 541
 542        mark_buffer_dirty(bh);
 543        nilfs_mdt_mark_dirty(sufile);
 544        brelse(bh);
 545
 546 out_sem:
 547        up_write(&NILFS_MDT(sufile)->mi_sem);
 548        return ret;
 549}
 550
 551/**
 552 * nilfs_sufile_get_stat - get segment usage statistics
 553 * @sufile: inode of segment usage file
 554 * @stat: pointer to a structure of segment usage statistics
 555 *
 556 * Description: nilfs_sufile_get_stat() returns information about segment
 557 * usage.
 558 *
 559 * Return Value: On success, 0 is returned, and segment usage information is
 560 * stored in the place pointed by @stat. On error, one of the following
 561 * negative error codes is returned.
 562 *
 563 * %-EIO - I/O error.
 564 *
 565 * %-ENOMEM - Insufficient amount of memory available.
 566 */
 567int nilfs_sufile_get_stat(struct inode *sufile, struct nilfs_sustat *sustat)
 568{
 569        struct buffer_head *header_bh;
 570        struct nilfs_sufile_header *header;
 571        struct the_nilfs *nilfs = sufile->i_sb->s_fs_info;
 572        void *kaddr;
 573        int ret;
 574
 575        down_read(&NILFS_MDT(sufile)->mi_sem);
 576
 577        ret = nilfs_sufile_get_header_block(sufile, &header_bh);
 578        if (ret < 0)
 579                goto out_sem;
 580
 581        kaddr = kmap_atomic(header_bh->b_page);
 582        header = kaddr + bh_offset(header_bh);
 583        sustat->ss_nsegs = nilfs_sufile_get_nsegments(sufile);
 584        sustat->ss_ncleansegs = le64_to_cpu(header->sh_ncleansegs);
 585        sustat->ss_ndirtysegs = le64_to_cpu(header->sh_ndirtysegs);
 586        sustat->ss_ctime = nilfs->ns_ctime;
 587        sustat->ss_nongc_ctime = nilfs->ns_nongc_ctime;
 588        spin_lock(&nilfs->ns_last_segment_lock);
 589        sustat->ss_prot_seq = nilfs->ns_prot_seq;
 590        spin_unlock(&nilfs->ns_last_segment_lock);
 591        kunmap_atomic(kaddr);
 592        brelse(header_bh);
 593
 594 out_sem:
 595        up_read(&NILFS_MDT(sufile)->mi_sem);
 596        return ret;
 597}
 598
 599void nilfs_sufile_do_set_error(struct inode *sufile, __u64 segnum,
 600                               struct buffer_head *header_bh,
 601                               struct buffer_head *su_bh)
 602{
 603        struct nilfs_segment_usage *su;
 604        void *kaddr;
 605        int suclean;
 606
 607        kaddr = kmap_atomic(su_bh->b_page);
 608        su = nilfs_sufile_block_get_segment_usage(sufile, segnum, su_bh, kaddr);
 609        if (nilfs_segment_usage_error(su)) {
 610                kunmap_atomic(kaddr);
 611                return;
 612        }
 613        suclean = nilfs_segment_usage_clean(su);
 614        nilfs_segment_usage_set_error(su);
 615        kunmap_atomic(kaddr);
 616
 617        if (suclean) {
 618                nilfs_sufile_mod_counter(header_bh, -1, 0);
 619                NILFS_SUI(sufile)->ncleansegs--;
 620        }
 621        mark_buffer_dirty(su_bh);
 622        nilfs_mdt_mark_dirty(sufile);
 623}
 624
 625/**
 626  * nilfs_sufile_truncate_range - truncate range of segment array
 627  * @sufile: inode of segment usage file
 628  * @start: start segment number (inclusive)
 629  * @end: end segment number (inclusive)
 630  *
 631  * Return Value: On success, 0 is returned.  On error, one of the
 632  * following negative error codes is returned.
 633  *
 634  * %-EIO - I/O error.
 635  *
 636  * %-ENOMEM - Insufficient amount of memory available.
 637  *
 638  * %-EINVAL - Invalid number of segments specified
 639  *
 640  * %-EBUSY - Dirty or active segments are present in the range
 641  */
 642static int nilfs_sufile_truncate_range(struct inode *sufile,
 643                                       __u64 start, __u64 end)
 644{
 645        struct the_nilfs *nilfs = sufile->i_sb->s_fs_info;
 646        struct buffer_head *header_bh;
 647        struct buffer_head *su_bh;
 648        struct nilfs_segment_usage *su, *su2;
 649        size_t susz = NILFS_MDT(sufile)->mi_entry_size;
 650        unsigned long segusages_per_block;
 651        unsigned long nsegs, ncleaned;
 652        __u64 segnum;
 653        void *kaddr;
 654        ssize_t n, nc;
 655        int ret;
 656        int j;
 657
 658        nsegs = nilfs_sufile_get_nsegments(sufile);
 659
 660        ret = -EINVAL;
 661        if (start > end || start >= nsegs)
 662                goto out;
 663
 664        ret = nilfs_sufile_get_header_block(sufile, &header_bh);
 665        if (ret < 0)
 666                goto out;
 667
 668        segusages_per_block = nilfs_sufile_segment_usages_per_block(sufile);
 669        ncleaned = 0;
 670
 671        for (segnum = start; segnum <= end; segnum += n) {
 672                n = min_t(unsigned long,
 673                          segusages_per_block -
 674                                  nilfs_sufile_get_offset(sufile, segnum),
 675                          end - segnum + 1);
 676                ret = nilfs_sufile_get_segment_usage_block(sufile, segnum, 0,
 677                                                           &su_bh);
 678                if (ret < 0) {
 679                        if (ret != -ENOENT)
 680                                goto out_header;
 681                        /* hole */
 682                        continue;
 683                }
 684                kaddr = kmap_atomic(su_bh->b_page);
 685                su = nilfs_sufile_block_get_segment_usage(
 686                        sufile, segnum, su_bh, kaddr);
 687                su2 = su;
 688                for (j = 0; j < n; j++, su = (void *)su + susz) {
 689                        if ((le32_to_cpu(su->su_flags) &
 690                             ~(1UL << NILFS_SEGMENT_USAGE_ERROR)) ||
 691                            nilfs_segment_is_active(nilfs, segnum + j)) {
 692                                ret = -EBUSY;
 693                                kunmap_atomic(kaddr);
 694                                brelse(su_bh);
 695                                goto out_header;
 696                        }
 697                }
 698                nc = 0;
 699                for (su = su2, j = 0; j < n; j++, su = (void *)su + susz) {
 700                        if (nilfs_segment_usage_error(su)) {
 701                                nilfs_segment_usage_set_clean(su);
 702                                nc++;
 703                        }
 704                }
 705                kunmap_atomic(kaddr);
 706                if (nc > 0) {
 707                        mark_buffer_dirty(su_bh);
 708                        ncleaned += nc;
 709                }
 710                brelse(su_bh);
 711
 712                if (n == segusages_per_block) {
 713                        /* make hole */
 714                        nilfs_sufile_delete_segment_usage_block(sufile, segnum);
 715                }
 716        }
 717        ret = 0;
 718
 719out_header:
 720        if (ncleaned > 0) {
 721                NILFS_SUI(sufile)->ncleansegs += ncleaned;
 722                nilfs_sufile_mod_counter(header_bh, ncleaned, 0);
 723                nilfs_mdt_mark_dirty(sufile);
 724        }
 725        brelse(header_bh);
 726out:
 727        return ret;
 728}
 729
 730/**
 731 * nilfs_sufile_resize - resize segment array
 732 * @sufile: inode of segment usage file
 733 * @newnsegs: new number of segments
 734 *
 735 * Return Value: On success, 0 is returned.  On error, one of the
 736 * following negative error codes is returned.
 737 *
 738 * %-EIO - I/O error.
 739 *
 740 * %-ENOMEM - Insufficient amount of memory available.
 741 *
 742 * %-ENOSPC - Enough free space is not left for shrinking
 743 *
 744 * %-EBUSY - Dirty or active segments exist in the region to be truncated
 745 */
 746int nilfs_sufile_resize(struct inode *sufile, __u64 newnsegs)
 747{
 748        struct the_nilfs *nilfs = sufile->i_sb->s_fs_info;
 749        struct buffer_head *header_bh;
 750        struct nilfs_sufile_header *header;
 751        struct nilfs_sufile_info *sui = NILFS_SUI(sufile);
 752        void *kaddr;
 753        unsigned long nsegs, nrsvsegs;
 754        int ret = 0;
 755
 756        down_write(&NILFS_MDT(sufile)->mi_sem);
 757
 758        nsegs = nilfs_sufile_get_nsegments(sufile);
 759        if (nsegs == newnsegs)
 760                goto out;
 761
 762        ret = -ENOSPC;
 763        nrsvsegs = nilfs_nrsvsegs(nilfs, newnsegs);
 764        if (newnsegs < nsegs && nsegs - newnsegs + nrsvsegs > sui->ncleansegs)
 765                goto out;
 766
 767        ret = nilfs_sufile_get_header_block(sufile, &header_bh);
 768        if (ret < 0)
 769                goto out;
 770
 771        if (newnsegs > nsegs) {
 772                sui->ncleansegs += newnsegs - nsegs;
 773        } else /* newnsegs < nsegs */ {
 774                ret = nilfs_sufile_truncate_range(sufile, newnsegs, nsegs - 1);
 775                if (ret < 0)
 776                        goto out_header;
 777
 778                sui->ncleansegs -= nsegs - newnsegs;
 779        }
 780
 781        kaddr = kmap_atomic(header_bh->b_page);
 782        header = kaddr + bh_offset(header_bh);
 783        header->sh_ncleansegs = cpu_to_le64(sui->ncleansegs);
 784        kunmap_atomic(kaddr);
 785
 786        mark_buffer_dirty(header_bh);
 787        nilfs_mdt_mark_dirty(sufile);
 788        nilfs_set_nsegments(nilfs, newnsegs);
 789
 790out_header:
 791        brelse(header_bh);
 792out:
 793        up_write(&NILFS_MDT(sufile)->mi_sem);
 794        return ret;
 795}
 796
 797/**
 798 * nilfs_sufile_get_suinfo -
 799 * @sufile: inode of segment usage file
 800 * @segnum: segment number to start looking
 801 * @buf: array of suinfo
 802 * @sisz: byte size of suinfo
 803 * @nsi: size of suinfo array
 804 *
 805 * Description:
 806 *
 807 * Return Value: On success, 0 is returned and .... On error, one of the
 808 * following negative error codes is returned.
 809 *
 810 * %-EIO - I/O error.
 811 *
 812 * %-ENOMEM - Insufficient amount of memory available.
 813 */
 814ssize_t nilfs_sufile_get_suinfo(struct inode *sufile, __u64 segnum, void *buf,
 815                                unsigned sisz, size_t nsi)
 816{
 817        struct buffer_head *su_bh;
 818        struct nilfs_segment_usage *su;
 819        struct nilfs_suinfo *si = buf;
 820        size_t susz = NILFS_MDT(sufile)->mi_entry_size;
 821        struct the_nilfs *nilfs = sufile->i_sb->s_fs_info;
 822        void *kaddr;
 823        unsigned long nsegs, segusages_per_block;
 824        ssize_t n;
 825        int ret, i, j;
 826
 827        down_read(&NILFS_MDT(sufile)->mi_sem);
 828
 829        segusages_per_block = nilfs_sufile_segment_usages_per_block(sufile);
 830        nsegs = min_t(unsigned long,
 831                      nilfs_sufile_get_nsegments(sufile) - segnum,
 832                      nsi);
 833        for (i = 0; i < nsegs; i += n, segnum += n) {
 834                n = min_t(unsigned long,
 835                          segusages_per_block -
 836                                  nilfs_sufile_get_offset(sufile, segnum),
 837                          nsegs - i);
 838                ret = nilfs_sufile_get_segment_usage_block(sufile, segnum, 0,
 839                                                           &su_bh);
 840                if (ret < 0) {
 841                        if (ret != -ENOENT)
 842                                goto out;
 843                        /* hole */
 844                        memset(si, 0, sisz * n);
 845                        si = (void *)si + sisz * n;
 846                        continue;
 847                }
 848
 849                kaddr = kmap_atomic(su_bh->b_page);
 850                su = nilfs_sufile_block_get_segment_usage(
 851                        sufile, segnum, su_bh, kaddr);
 852                for (j = 0; j < n;
 853                     j++, su = (void *)su + susz, si = (void *)si + sisz) {
 854                        si->sui_lastmod = le64_to_cpu(su->su_lastmod);
 855                        si->sui_nblocks = le32_to_cpu(su->su_nblocks);
 856                        si->sui_flags = le32_to_cpu(su->su_flags) &
 857                                ~(1UL << NILFS_SEGMENT_USAGE_ACTIVE);
 858                        if (nilfs_segment_is_active(nilfs, segnum + j))
 859                                si->sui_flags |=
 860                                        (1UL << NILFS_SEGMENT_USAGE_ACTIVE);
 861                }
 862                kunmap_atomic(kaddr);
 863                brelse(su_bh);
 864        }
 865        ret = nsegs;
 866
 867 out:
 868        up_read(&NILFS_MDT(sufile)->mi_sem);
 869        return ret;
 870}
 871
 872/**
 873 * nilfs_sufile_set_suinfo - sets segment usage info
 874 * @sufile: inode of segment usage file
 875 * @buf: array of suinfo_update
 876 * @supsz: byte size of suinfo_update
 877 * @nsup: size of suinfo_update array
 878 *
 879 * Description: Takes an array of nilfs_suinfo_update structs and updates
 880 * segment usage accordingly. Only the fields indicated by the sup_flags
 881 * are updated.
 882 *
 883 * Return Value: On success, 0 is returned. On error, one of the
 884 * following negative error codes is returned.
 885 *
 886 * %-EIO - I/O error.
 887 *
 888 * %-ENOMEM - Insufficient amount of memory available.
 889 *
 890 * %-EINVAL - Invalid values in input (segment number, flags or nblocks)
 891 */
 892ssize_t nilfs_sufile_set_suinfo(struct inode *sufile, void *buf,
 893                                unsigned supsz, size_t nsup)
 894{
 895        struct the_nilfs *nilfs = sufile->i_sb->s_fs_info;
 896        struct buffer_head *header_bh, *bh;
 897        struct nilfs_suinfo_update *sup, *supend = buf + supsz * nsup;
 898        struct nilfs_segment_usage *su;
 899        void *kaddr;
 900        unsigned long blkoff, prev_blkoff;
 901        int cleansi, cleansu, dirtysi, dirtysu;
 902        long ncleaned = 0, ndirtied = 0;
 903        int ret = 0;
 904
 905        if (unlikely(nsup == 0))
 906                return ret;
 907
 908        for (sup = buf; sup < supend; sup = (void *)sup + supsz) {
 909                if (sup->sup_segnum >= nilfs->ns_nsegments
 910                        || (sup->sup_flags &
 911                                (~0UL << __NR_NILFS_SUINFO_UPDATE_FIELDS))
 912                        || (nilfs_suinfo_update_nblocks(sup) &&
 913                                sup->sup_sui.sui_nblocks >
 914                                nilfs->ns_blocks_per_segment))
 915                        return -EINVAL;
 916        }
 917
 918        down_write(&NILFS_MDT(sufile)->mi_sem);
 919
 920        ret = nilfs_sufile_get_header_block(sufile, &header_bh);
 921        if (ret < 0)
 922                goto out_sem;
 923
 924        sup = buf;
 925        blkoff = nilfs_sufile_get_blkoff(sufile, sup->sup_segnum);
 926        ret = nilfs_mdt_get_block(sufile, blkoff, 1, NULL, &bh);
 927        if (ret < 0)
 928                goto out_header;
 929
 930        for (;;) {
 931                kaddr = kmap_atomic(bh->b_page);
 932                su = nilfs_sufile_block_get_segment_usage(
 933                        sufile, sup->sup_segnum, bh, kaddr);
 934
 935                if (nilfs_suinfo_update_lastmod(sup))
 936                        su->su_lastmod = cpu_to_le64(sup->sup_sui.sui_lastmod);
 937
 938                if (nilfs_suinfo_update_nblocks(sup))
 939                        su->su_nblocks = cpu_to_le32(sup->sup_sui.sui_nblocks);
 940
 941                if (nilfs_suinfo_update_flags(sup)) {
 942                        /*
 943                         * Active flag is a virtual flag projected by running
 944                         * nilfs kernel code - drop it not to write it to
 945                         * disk.
 946                         */
 947                        sup->sup_sui.sui_flags &=
 948                                        ~(1UL << NILFS_SEGMENT_USAGE_ACTIVE);
 949
 950                        cleansi = nilfs_suinfo_clean(&sup->sup_sui);
 951                        cleansu = nilfs_segment_usage_clean(su);
 952                        dirtysi = nilfs_suinfo_dirty(&sup->sup_sui);
 953                        dirtysu = nilfs_segment_usage_dirty(su);
 954
 955                        if (cleansi && !cleansu)
 956                                ++ncleaned;
 957                        else if (!cleansi && cleansu)
 958                                --ncleaned;
 959
 960                        if (dirtysi && !dirtysu)
 961                                ++ndirtied;
 962                        else if (!dirtysi && dirtysu)
 963                                --ndirtied;
 964
 965                        su->su_flags = cpu_to_le32(sup->sup_sui.sui_flags);
 966                }
 967
 968                kunmap_atomic(kaddr);
 969
 970                sup = (void *)sup + supsz;
 971                if (sup >= supend)
 972                        break;
 973
 974                prev_blkoff = blkoff;
 975                blkoff = nilfs_sufile_get_blkoff(sufile, sup->sup_segnum);
 976                if (blkoff == prev_blkoff)
 977                        continue;
 978
 979                /* get different block */
 980                mark_buffer_dirty(bh);
 981                put_bh(bh);
 982                ret = nilfs_mdt_get_block(sufile, blkoff, 1, NULL, &bh);
 983                if (unlikely(ret < 0))
 984                        goto out_mark;
 985        }
 986        mark_buffer_dirty(bh);
 987        put_bh(bh);
 988
 989 out_mark:
 990        if (ncleaned || ndirtied) {
 991                nilfs_sufile_mod_counter(header_bh, (u64)ncleaned,
 992                                (u64)ndirtied);
 993                NILFS_SUI(sufile)->ncleansegs += ncleaned;
 994        }
 995        nilfs_mdt_mark_dirty(sufile);
 996 out_header:
 997        put_bh(header_bh);
 998 out_sem:
 999        up_write(&NILFS_MDT(sufile)->mi_sem);
1000        return ret;
1001}
1002
1003/**
1004 * nilfs_sufile_trim_fs() - trim ioctl handle function
1005 * @sufile: inode of segment usage file
1006 * @range: fstrim_range structure
1007 *
1008 * start:       First Byte to trim
1009 * len:         number of Bytes to trim from start
1010 * minlen:      minimum extent length in Bytes
1011 *
1012 * Decription: nilfs_sufile_trim_fs goes through all segments containing bytes
1013 * from start to start+len. start is rounded up to the next block boundary
1014 * and start+len is rounded down. For each clean segment blkdev_issue_discard
1015 * function is invoked.
1016 *
1017 * Return Value: On success, 0 is returned or negative error code, otherwise.
1018 */
1019int nilfs_sufile_trim_fs(struct inode *sufile, struct fstrim_range *range)
1020{
1021        struct the_nilfs *nilfs = sufile->i_sb->s_fs_info;
1022        struct buffer_head *su_bh;
1023        struct nilfs_segment_usage *su;
1024        void *kaddr;
1025        size_t n, i, susz = NILFS_MDT(sufile)->mi_entry_size;
1026        sector_t seg_start, seg_end, start_block, end_block;
1027        sector_t start = 0, nblocks = 0;
1028        u64 segnum, segnum_end, minlen, len, max_blocks, ndiscarded = 0;
1029        int ret = 0;
1030        unsigned int sects_per_block;
1031
1032        sects_per_block = (1 << nilfs->ns_blocksize_bits) /
1033                        bdev_logical_block_size(nilfs->ns_bdev);
1034        len = range->len >> nilfs->ns_blocksize_bits;
1035        minlen = range->minlen >> nilfs->ns_blocksize_bits;
1036        max_blocks = ((u64)nilfs->ns_nsegments * nilfs->ns_blocks_per_segment);
1037
1038        if (!len || range->start >= max_blocks << nilfs->ns_blocksize_bits)
1039                return -EINVAL;
1040
1041        start_block = (range->start + nilfs->ns_blocksize - 1) >>
1042                        nilfs->ns_blocksize_bits;
1043
1044        /*
1045         * range->len can be very large (actually, it is set to
1046         * ULLONG_MAX by default) - truncate upper end of the range
1047         * carefully so as not to overflow.
1048         */
1049        if (max_blocks - start_block < len)
1050                end_block = max_blocks - 1;
1051        else
1052                end_block = start_block + len - 1;
1053
1054        segnum = nilfs_get_segnum_of_block(nilfs, start_block);
1055        segnum_end = nilfs_get_segnum_of_block(nilfs, end_block);
1056
1057        down_read(&NILFS_MDT(sufile)->mi_sem);
1058
1059        while (segnum <= segnum_end) {
1060                n = nilfs_sufile_segment_usages_in_block(sufile, segnum,
1061                                segnum_end);
1062
1063                ret = nilfs_sufile_get_segment_usage_block(sufile, segnum, 0,
1064                                                           &su_bh);
1065                if (ret < 0) {
1066                        if (ret != -ENOENT)
1067                                goto out_sem;
1068                        /* hole */
1069                        segnum += n;
1070                        continue;
1071                }
1072
1073                kaddr = kmap_atomic(su_bh->b_page);
1074                su = nilfs_sufile_block_get_segment_usage(sufile, segnum,
1075                                su_bh, kaddr);
1076                for (i = 0; i < n; ++i, ++segnum, su = (void *)su + susz) {
1077                        if (!nilfs_segment_usage_clean(su))
1078                                continue;
1079
1080                        nilfs_get_segment_range(nilfs, segnum, &seg_start,
1081                                                &seg_end);
1082
1083                        if (!nblocks) {
1084                                /* start new extent */
1085                                start = seg_start;
1086                                nblocks = seg_end - seg_start + 1;
1087                                continue;
1088                        }
1089
1090                        if (start + nblocks == seg_start) {
1091                                /* add to previous extent */
1092                                nblocks += seg_end - seg_start + 1;
1093                                continue;
1094                        }
1095
1096                        /* discard previous extent */
1097                        if (start < start_block) {
1098                                nblocks -= start_block - start;
1099                                start = start_block;
1100                        }
1101
1102                        if (nblocks >= minlen) {
1103                                kunmap_atomic(kaddr);
1104
1105                                ret = blkdev_issue_discard(nilfs->ns_bdev,
1106                                                start * sects_per_block,
1107                                                nblocks * sects_per_block,
1108                                                GFP_NOFS, 0);
1109                                if (ret < 0) {
1110                                        put_bh(su_bh);
1111                                        goto out_sem;
1112                                }
1113
1114                                ndiscarded += nblocks;
1115                                kaddr = kmap_atomic(su_bh->b_page);
1116                                su = nilfs_sufile_block_get_segment_usage(
1117                                        sufile, segnum, su_bh, kaddr);
1118                        }
1119
1120                        /* start new extent */
1121                        start = seg_start;
1122                        nblocks = seg_end - seg_start + 1;
1123                }
1124                kunmap_atomic(kaddr);
1125                put_bh(su_bh);
1126        }
1127
1128
1129        if (nblocks) {
1130                /* discard last extent */
1131                if (start < start_block) {
1132                        nblocks -= start_block - start;
1133                        start = start_block;
1134                }
1135                if (start + nblocks > end_block + 1)
1136                        nblocks = end_block - start + 1;
1137
1138                if (nblocks >= minlen) {
1139                        ret = blkdev_issue_discard(nilfs->ns_bdev,
1140                                        start * sects_per_block,
1141                                        nblocks * sects_per_block,
1142                                        GFP_NOFS, 0);
1143                        if (!ret)
1144                                ndiscarded += nblocks;
1145                }
1146        }
1147
1148out_sem:
1149        up_read(&NILFS_MDT(sufile)->mi_sem);
1150
1151        range->len = ndiscarded << nilfs->ns_blocksize_bits;
1152        return ret;
1153}
1154
1155/**
1156 * nilfs_sufile_read - read or get sufile inode
1157 * @sb: super block instance
1158 * @susize: size of a segment usage entry
1159 * @raw_inode: on-disk sufile inode
1160 * @inodep: buffer to store the inode
1161 */
1162int nilfs_sufile_read(struct super_block *sb, size_t susize,
1163                      struct nilfs_inode *raw_inode, struct inode **inodep)
1164{
1165        struct inode *sufile;
1166        struct nilfs_sufile_info *sui;
1167        struct buffer_head *header_bh;
1168        struct nilfs_sufile_header *header;
1169        void *kaddr;
1170        int err;
1171
1172        if (susize > sb->s_blocksize) {
1173                printk(KERN_ERR
1174                       "NILFS: too large segment usage size: %zu bytes.\n",
1175                       susize);
1176                return -EINVAL;
1177        } else if (susize < NILFS_MIN_SEGMENT_USAGE_SIZE) {
1178                printk(KERN_ERR
1179                       "NILFS: too small segment usage size: %zu bytes.\n",
1180                       susize);
1181                return -EINVAL;
1182        }
1183
1184        sufile = nilfs_iget_locked(sb, NULL, NILFS_SUFILE_INO);
1185        if (unlikely(!sufile))
1186                return -ENOMEM;
1187        if (!(sufile->i_state & I_NEW))
1188                goto out;
1189
1190        err = nilfs_mdt_init(sufile, NILFS_MDT_GFP, sizeof(*sui));
1191        if (err)
1192                goto failed;
1193
1194        nilfs_mdt_set_entry_size(sufile, susize,
1195                                 sizeof(struct nilfs_sufile_header));
1196
1197        err = nilfs_read_inode_common(sufile, raw_inode);
1198        if (err)
1199                goto failed;
1200
1201        err = nilfs_sufile_get_header_block(sufile, &header_bh);
1202        if (err)
1203                goto failed;
1204
1205        sui = NILFS_SUI(sufile);
1206        kaddr = kmap_atomic(header_bh->b_page);
1207        header = kaddr + bh_offset(header_bh);
1208        sui->ncleansegs = le64_to_cpu(header->sh_ncleansegs);
1209        kunmap_atomic(kaddr);
1210        brelse(header_bh);
1211
1212        sui->allocmax = nilfs_sufile_get_nsegments(sufile) - 1;
1213        sui->allocmin = 0;
1214
1215        unlock_new_inode(sufile);
1216 out:
1217        *inodep = sufile;
1218        return 0;
1219 failed:
1220        iget_failed(sufile);
1221        return err;
1222}
1223