Re: [PATCH 3/4] ceph: simplify calling of ceph_get_fmode()

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

 



On Fri, 2020-02-21 at 10:34 +0800, Yan, Zheng wrote:
> On Fri, Feb 21, 2020 at 3:15 AM Jeff Layton <jlayton@xxxxxxxxxx> wrote:
> > On Thu, 2020-02-20 at 20:26 +0800, Yan, Zheng wrote:
> > > Call ceph_get_fmode() when initializing file. Because fill_inode()
> > > already calls ceph_touch_fmode() for open file request. It affects
> > 
> > You mean __ceph_touch_fmode()
> > 
> > > __ceph_caps_file_wanted() for 'caps_wanted_delay_min' seconds, enough
> > > for ceph_get_fmode() to get called by ceph_init_file_info().
> > > 
> > 
> > I don't understand this changelog. Are you saying there is a potential
> > race of some sort, but that you don't think it's something we can hit in
> > practice?
> > 
> 
> The thread that runs handle_reply() and the open request initiator are
> different. There is a small window between waking up the request
> initiator and the initiator calling ceph_get_fmode(). Someone else may
> call ceph_check_caps() in that window and wrongly release wanted caps.
> This is the reason the old code calls __ceph_get_fmode() in fill_inode().
> 
> 

Ok. So how are you addressing this race in this series? Is it just that
we now hold on to caps for a minimal amount of time, and we just assume
that ceph_get_fmode() will be called before they can expire?

> > > Signed-off-by: "Yan, Zheng" <zyan@xxxxxxxxxx>
> > > ---
> > >  fs/ceph/caps.c  | 26 +++-----------------------
> > >  fs/ceph/file.c  | 21 +++++----------------
> > >  fs/ceph/inode.c |  8 +-------
> > >  fs/ceph/super.h |  3 +--
> > >  4 files changed, 10 insertions(+), 48 deletions(-)
> > > 
> > > diff --git a/fs/ceph/caps.c b/fs/ceph/caps.c
> > > index ccdc47bd7cf0..2f4ff7e9508e 100644
> > > --- a/fs/ceph/caps.c
> > > +++ b/fs/ceph/caps.c
> > > @@ -606,7 +606,7 @@ static void __check_cap_issue(struct ceph_inode_info *ci, struct ceph_cap *cap,
> > >   */
> > >  void ceph_add_cap(struct inode *inode,
> > >                 struct ceph_mds_session *session, u64 cap_id,
> > > -               int fmode, unsigned issued, unsigned wanted,
> > > +               unsigned issued, unsigned wanted,
> > >                 unsigned seq, unsigned mseq, u64 realmino, int flags,
> > >                 struct ceph_cap **new_cap)
> > >  {
> > > @@ -622,13 +622,6 @@ void ceph_add_cap(struct inode *inode,
> > >       dout("add_cap %p mds%d cap %llx %s seq %d\n", inode,
> > >            session->s_mds, cap_id, ceph_cap_string(issued), seq);
> > > 
> > > -     /*
> > > -      * If we are opening the file, include file mode wanted bits
> > > -      * in wanted.
> > > -      */
> > > -     if (fmode >= 0)
> > > -             wanted |= ceph_caps_for_mode(fmode);
> > > -
> > >       spin_lock(&session->s_gen_ttl_lock);
> > >       gen = session->s_cap_gen;
> > >       spin_unlock(&session->s_gen_ttl_lock);
> > > @@ -753,9 +746,6 @@ void ceph_add_cap(struct inode *inode,
> > >       cap->issue_seq = seq;
> > >       cap->mseq = mseq;
> > >       cap->cap_gen = gen;
> > > -
> > > -     if (fmode >= 0)
> > > -             __ceph_get_fmode(ci, fmode);
> > >  }
> > > 
> > >  /*
> > > @@ -3726,7 +3716,7 @@ static void handle_cap_export(struct inode *inode, struct ceph_mds_caps *ex,
> > >               /* add placeholder for the export tagert */
> > >               int flag = (cap == ci->i_auth_cap) ? CEPH_CAP_FLAG_AUTH : 0;
> > >               tcap = new_cap;
> > > -             ceph_add_cap(inode, tsession, t_cap_id, -1, issued, 0,
> > > +             ceph_add_cap(inode, tsession, t_cap_id, issued, 0,
> > >                            t_seq - 1, t_mseq, (u64)-1, flag, &new_cap);
> > > 
> > >               if (!list_empty(&ci->i_cap_flush_list) &&
> > > @@ -3831,7 +3821,7 @@ static void handle_cap_import(struct ceph_mds_client *mdsc,
> > >       __ceph_caps_issued(ci, &issued);
> > >       issued |= __ceph_caps_dirty(ci);
> > > 
> > > -     ceph_add_cap(inode, session, cap_id, -1, caps, wanted, seq, mseq,
> > > +     ceph_add_cap(inode, session, cap_id, caps, wanted, seq, mseq,
> > >                    realmino, CEPH_CAP_FLAG_AUTH, &new_cap);
> > > 
> > >       ocap = peer >= 0 ? __get_cap_for_mds(ci, peer) : NULL;
> > > @@ -4186,16 +4176,6 @@ void ceph_get_fmode(struct ceph_inode_info *ci, int fmode, int count)
> > >       spin_unlock(&ci->i_ceph_lock);
> > >  }
> > > 
> > > -void __ceph_get_fmode(struct ceph_inode_info *ci, int fmode)
> > > -{
> > > -     int i;
> > > -     int bits = (fmode << 1) | 1;
> > > -     for (i = 0; i < CEPH_FILE_MODE_BITS; i++) {
> > > -             if (bits & (1 << i))
> > > -                     ci->i_file_by_mode[i].nr++;
> > > -     }
> > > -}
> > > -
> > >  /*
> > >   * Drop open file reference.  If we were the last open file,
> > >   * we may need to release capabilities to the MDS (or schedule
> > > diff --git a/fs/ceph/file.c b/fs/ceph/file.c
> > > index f28f420bad23..60a2dfa02ba2 100644
> > > --- a/fs/ceph/file.c
> > > +++ b/fs/ceph/file.c
> > > @@ -212,10 +212,8 @@ static int ceph_init_file_info(struct inode *inode, struct file *file,
> > >       if (isdir) {
> > >               struct ceph_dir_file_info *dfi =
> > >                       kmem_cache_zalloc(ceph_dir_file_cachep, GFP_KERNEL);
> > > -             if (!dfi) {
> > > -                     ceph_put_fmode(ci, fmode, 1); /* clean up */
> > > +             if (!dfi)
> > >                       return -ENOMEM;
> > > -             }
> > > 
> > >               file->private_data = dfi;
> > >               fi = &dfi->file_info;
> > > @@ -223,15 +221,15 @@ static int ceph_init_file_info(struct inode *inode, struct file *file,
> > >               dfi->readdir_cache_idx = -1;
> > >       } else {
> > >               fi = kmem_cache_zalloc(ceph_file_cachep, GFP_KERNEL);
> > > -             if (!fi) {
> > > -                     ceph_put_fmode(ci, fmode, 1); /* clean up */
> > > +             if (!fi)
> > >                       return -ENOMEM;
> > > -             }
> > > 
> > >               file->private_data = fi;
> > >       }
> > > 
> > > +     ceph_get_fmode(ci, fmode, 1);
> > >       fi->fmode = fmode;
> > > +
> > >       spin_lock_init(&fi->rw_contexts_lock);
> > >       INIT_LIST_HEAD(&fi->rw_contexts);
> > >       fi->meta_err = errseq_sample(&ci->i_meta_err);
> > > @@ -263,7 +261,6 @@ static int ceph_init_file(struct inode *inode, struct file *file, int fmode)
> > >       case S_IFLNK:
> > >               dout("init_file %p %p 0%o (symlink)\n", inode, file,
> > >                    inode->i_mode);
> > > -             ceph_put_fmode(ceph_inode(inode), fmode, 1); /* clean up */
> > >               break;
> > > 
> > >       default:
> > > @@ -273,7 +270,6 @@ static int ceph_init_file(struct inode *inode, struct file *file, int fmode)
> > >                * we need to drop the open ref now, since we don't
> > >                * have .release set to ceph_release.
> > >                */
> > > -             ceph_put_fmode(ceph_inode(inode), fmode, 1); /* clean up */
> > >               BUG_ON(inode->i_fop->release == ceph_release);
> > > 
> > >               /* call the proper open fop */
> > > @@ -327,7 +323,6 @@ int ceph_renew_caps(struct inode *inode, int fmode)
> > >       req->r_inode = inode;
> > >       ihold(inode);
> > >       req->r_num_caps = 1;
> > > -     req->r_fmode = -1;
> > > 
> > >       err = ceph_mdsc_do_request(mdsc, NULL, req);
> > >       ceph_mdsc_put_request(req);
> > > @@ -373,9 +368,6 @@ int ceph_open(struct inode *inode, struct file *file)
> > > 
> > >       /* trivially open snapdir */
> > >       if (ceph_snap(inode) == CEPH_SNAPDIR) {
> > > -             spin_lock(&ci->i_ceph_lock);
> > > -             __ceph_get_fmode(ci, fmode);
> > > -             spin_unlock(&ci->i_ceph_lock);
> > >               return ceph_init_file(inode, file, fmode);
> > >       }
> > > 
> > > @@ -393,7 +385,7 @@ int ceph_open(struct inode *inode, struct file *file)
> > >               dout("open %p fmode %d want %s issued %s using existing\n",
> > >                    inode, fmode, ceph_cap_string(wanted),
> > >                    ceph_cap_string(issued));
> > > -             __ceph_get_fmode(ci, fmode);
> > > +             __ceph_touch_fmode(ci, mdsc, fmode);
> > >               spin_unlock(&ci->i_ceph_lock);
> > > 
> > >               /* adjust wanted? */
> > > @@ -405,7 +397,6 @@ int ceph_open(struct inode *inode, struct file *file)
> > >               return ceph_init_file(inode, file, fmode);
> > >       } else if (ceph_snap(inode) != CEPH_NOSNAP &&
> > >                  (ci->i_snap_caps & wanted) == wanted) {
> > > -             __ceph_get_fmode(ci, fmode);
> > >               __ceph_touch_fmode(ci, mdsc, fmode);
> > >               spin_unlock(&ci->i_ceph_lock);
> > >               return ceph_init_file(inode, file, fmode);
> > > @@ -526,8 +517,6 @@ int ceph_atomic_open(struct inode *dir, struct dentry *dentry,
> > >               err = finish_open(file, dentry, ceph_open);
> > >       }
> > >  out_req:
> > > -     if (!req->r_err && req->r_target_inode)
> > > -             ceph_put_fmode(ceph_inode(req->r_target_inode), req->r_fmode, 1);
> > >       ceph_mdsc_put_request(req);
> > >  out_ctx:
> > >       ceph_release_acl_sec_ctx(&as_ctx);
> > > diff --git a/fs/ceph/inode.c b/fs/ceph/inode.c
> > > index b279bd8e168e..bb73b0c8c4d9 100644
> > > --- a/fs/ceph/inode.c
> > > +++ b/fs/ceph/inode.c
> > > @@ -969,7 +969,7 @@ static int fill_inode(struct inode *inode, struct page *locked_page,
> > >               if (ceph_snap(inode) == CEPH_NOSNAP) {
> > >                       ceph_add_cap(inode, session,
> > >                                    le64_to_cpu(info->cap.cap_id),
> > > -                                  cap_fmode, info_caps,
> > > +                                  info_caps,
> > >                                    le32_to_cpu(info->cap.wanted),
> > >                                    le32_to_cpu(info->cap.seq),
> > >                                    le32_to_cpu(info->cap.mseq),
> > > @@ -994,13 +994,7 @@ static int fill_inode(struct inode *inode, struct page *locked_page,
> > >                       dout(" %p got snap_caps %s\n", inode,
> > >                            ceph_cap_string(info_caps));
> > >                       ci->i_snap_caps |= info_caps;
> > > -                     if (cap_fmode >= 0)
> > > -                             __ceph_get_fmode(ci, cap_fmode);
> > >               }
> > > -     } else if (cap_fmode >= 0) {
> > > -             pr_warn("mds issued no caps on %llx.%llx\n",
> > > -                        ceph_vinop(inode));
> > > -             __ceph_get_fmode(ci, cap_fmode);
> > >       }
> > > 
> > >       if (iinfo->inline_version > 0 &&
> > > diff --git a/fs/ceph/super.h b/fs/ceph/super.h
> > > index 029823643b8b..1ea76466efcb 100644
> > > --- a/fs/ceph/super.h
> > > +++ b/fs/ceph/super.h
> > > @@ -1038,7 +1038,7 @@ extern struct ceph_cap *ceph_get_cap(struct ceph_mds_client *mdsc,
> > >                                    struct ceph_cap_reservation *ctx);
> > >  extern void ceph_add_cap(struct inode *inode,
> > >                        struct ceph_mds_session *session, u64 cap_id,
> > > -                      int fmode, unsigned issued, unsigned wanted,
> > > +                      unsigned issued, unsigned wanted,
> > >                        unsigned cap, unsigned seq, u64 realmino, int flags,
> > >                        struct ceph_cap **new_cap);
> > >  extern void __ceph_remove_cap(struct ceph_cap *cap, bool queue_release);
> > > @@ -1080,7 +1080,6 @@ extern int ceph_try_get_caps(struct inode *inode,
> > >                            int need, int want, bool nonblock, int *got);
> > > 
> > >  /* for counting open files by mode */
> > > -extern void __ceph_get_fmode(struct ceph_inode_info *ci, int mode);
> > >  extern void ceph_get_fmode(struct ceph_inode_info *ci, int mode, int count);
> > >  extern void ceph_put_fmode(struct ceph_inode_info *ci, int mode, int count);
> > >  extern void __ceph_touch_fmode(struct ceph_inode_info *ci,
> > 
> > --
> > Jeff Layton <jlayton@xxxxxxxxxx>
> > 

-- 
Jeff Layton <jlayton@xxxxxxxxxx>




[Index of Archives]     [CEPH Users]     [Ceph Large]     [Ceph Dev]     [Information on CEPH]     [Linux BTRFS]     [Linux USB Devel]     [Video for Linux]     [Linux Audio Users]     [Yosemite News]     [Linux Kernel]     [Linux SCSI]

  Powered by Linux