On Tue, Mar 15, 2011 at 3:34 PM, Jeff Layton <[email protected]> wrote:
> On Tue, 8 Mar 2011 22:34:51 -0600
> [email protected] wrote:
>
>> From: Shirish Pargaonkar <[email protected]>
>>
>>
>> rb tree search and insertion routines.
>>
>> A SID which needs to be mapped, is looked up in one of the rb trees
>> depending whether SID is either owner or group SID.
>> If found in the tree, a (mapped) id from that node is assigned to
>> uid or gid as appropriate. If upcall returns an error, mapping
>> is retried after a timeout period.
>>
>> Otherwise, an node is inserted in the tree and a mapping id for
>> that SID is looked-up with the help of Winbind via upcall mechanism.
>> If, for whatever reasons, winbind calls return error, SID for an
>> owner is mapped to 'nobody' and SID for a group is mapped to 'nogroup'.
>>
>> To map a SID, which can be either a Owner SID or a Group SID, key
>> description starts with the string "os" or "gs" followed by SID converted
>> to a string. Without "os" or "gs", cifs.upcall does not know whether
>> SID needs to be mapped to either an uid or a gid.
>>
>> Nodes in rb tree as fields to prevent multiple upcalls for
>> a SID. Adding and removing nodes is done within global locks.
>> shrinker routine does not prune a node if mapping for that node
>> is either pending or or node was recently created (before timeout
>> period expires and node could be purged). The timeout period should
>> be long enough at least for an upcall to return back to cifs.
>>
>> For now, cifs.upcall is only used to map a SID to an id (uid or gid) but
>> it would be used to obtain an SID (string) for an id.
>>
>>
>> Signed-off-by: Shirish Pargaonkar <[email protected]>
>> ---
>> fs/cifs/cifsacl.c | 326
>> +++++++++++++++++++++++++++++++++++++++++++++++++----
>> fs/cifs/cifsacl.h | 23 ++++
>> 2 files changed, 325 insertions(+), 24 deletions(-)
>>
>> diff --git a/fs/cifs/cifsacl.c b/fs/cifs/cifsacl.c
>> index fc1ec64..aea06ef 100644
>> --- a/fs/cifs/cifsacl.c
>> +++ b/fs/cifs/cifsacl.c
>> @@ -54,7 +54,31 @@ static const struct cifs_sid sid_authusers = {
>> /* group users */
>> static const struct cifs_sid sid_user = {1, 2 , {0, 0, 0, 0, 0, 5}, {} };
>>
>> -static const struct cred *root_cred;
>> +const struct cred *root_cred;
>> +
>> +void
>> +shrink_idmap_tree(struct rb_root *root, int nr_to_scan, int *nr_rem,
>> + int *nr_del)
>> +{
>> + struct rb_node *node;
>> + struct rb_node *tmp;
>> + struct cifs_sid_id *psidid;
>> +
>> + node = rb_first(root);
>> + while (node) {
>> + tmp = node;
>> + node = rb_next(tmp);
>> + psidid = rb_entry(tmp, struct cifs_sid_id, rbnode);
>> + if (time_after(psidid->time + SID_MAP_EXPIRE, jiffies) ||
>> + test_bit(SID_ID_PENDING, &psidid->state) ||
>> + (nr_to_scan == 0) || (*nr_del == nr_to_scan))
>> + ++(*nr_rem);
>> + else {
>> + rb_erase(tmp, root);
>> + ++(*nr_del);
>> + }
>> + }
>> +}
>>
>> /*
>> * Run idmap cache shrinker.
>> @@ -62,11 +86,24 @@ static const struct cred *root_cred;
>> static int
>> cifs_idmap_shrinker(struct shrinker *shrink, int nr_to_scan, gfp_t gfp_mask)
>> {
>> - /* Use a pruning scheme in a subsequent patch instead */
>> - cifs_destroy_idmaptrees();
>> - return 0;
>> + int nr_del = 0;
>> + int nr_rem = 0;
>> + struct rb_root *root;
>> +
>> + root = &uidtree;
>> + spin_lock(&siduidlock);
>> + shrink_idmap_tree(root, nr_to_scan, &nr_rem, &nr_del);
>> + spin_unlock(&siduidlock);
>> +
>> + root = &gidtree;
>> + spin_lock(&sidgidlock);
>> + shrink_idmap_tree(root, nr_to_scan, &nr_rem, &nr_del);
>> + spin_unlock(&sidgidlock);
>> +
>> + return nr_rem;
>> }
>>
>> +
>> static struct shrinker cifs_shrinker = {
>> .shrink = cifs_idmap_shrinker,
>> .seeks = DEFAULT_SEEKS,
>> @@ -92,7 +129,6 @@ cifs_idmap_key_destroy(struct key *key)
>> kfree(key->payload.data);
>> }
>>
>> -static
>> struct key_type cifs_idmap_key_type = {
>> .name = "cifs.cifs_idmap",
>> .instantiate = cifs_idmap_key_instantiate,
>> @@ -101,6 +137,222 @@ struct key_type cifs_idmap_key_type = {
>> .match = user_match,
>> };
>>
>> +static struct cifs_sid_id *
>> +id_rb_lookup(struct rb_root *root, struct cifs_sid *sidptr,
>> + struct rb_node **sparent, struct rb_node ***slinkto)
>> +{
>> + int rc;
>> + struct cifs_sid_id *lsidid;
>> + struct rb_node *node = root->rb_node;
>> + struct rb_node *parent = NULL;
>> + struct rb_node **linkto = &(root->rb_node);
>> +
>> + while (node) {
>> + lsidid = rb_entry(node, struct cifs_sid_id, rbnode);
>> + parent = node;
>> + rc = compare_sids(sidptr, &((lsidid)->sid));
>> + if (rc > 0) {
>> + linkto = &(node->rb_left);
>> + node = node->rb_left;
>> + } else if (rc < 0) {
>> + linkto = &(node->rb_right);
>> + node = node->rb_right;
>> + } else /* node found */
>> + return lsidid;
>> + }
>> + if (sparent && slinkto) {
>> + *sparent = parent;
>> + *slinkto = linkto;
>> + }
>> +
>> + return NULL;
>> +}
>> +
>> +static struct cifs_sid_id *
>> +id_rb_add(struct rb_root *root, struct cifs_sid *sidptr, bool *sidmap,
>> + struct cifs_sid_id **psidid)
>> +{
>> + struct cifs_sid_id *lsidid;
>> + struct rb_node *parent;
>> + struct rb_node **linkto;
>> +
>> + lsidid = id_rb_lookup(root, sidptr, &parent, &linkto);
>> + if (!lsidid) { /* node did not happen to get added, so add it */
>> + *sidmap = false;
>> + memcpy(&(*psidid)->sid, sidptr, sizeof(struct cifs_sid));
>> + set_bit(SID_ID_PENDING, &(*psidid)->state);
>> + set_bit(SID_ID_UNMAPPED, &(*psidid)->state);
>> +
>> + rb_link_node(&(*psidid)->rbnode, parent, linkto);
>> + rb_insert_color(&(*psidid)->rbnode, root);
>> + }
>> +
>> + return lsidid;
>> +}
>> +
>> +static struct cifs_sid_id *
>> +id_rb_search(struct rb_root *root, struct cifs_sid *sidptr, bool *sidmap)
>> +{
>> + struct cifs_sid_id *lsidid;
>> +
>> + lsidid = id_rb_lookup(root, sidptr, NULL, NULL);
>> + if (lsidid) { /* node found */
>> + if (test_bit(SID_ID_UNMAPPED, &(lsidid)->state) &&
>> + !time_after((lsidid)->retry + SID_MAP_RETRY,
>> + jiffies)) { /* unmapped SID */
>> + if (!test_and_set_bit(SID_ID_PENDING,
>> &(lsidid)->state))
>> + *sidmap = false; /* get to retry mapping */
>> + }
>> + }
>> +
>> + return lsidid;
>> +}
>> +
>> +static void
>> +sid_to_str(struct cifs_sid *sidptr, char *sidstr)
>> +{
>> + int i;
>> + unsigned long saval;
>> + char *strptr;
>> +
>> + strptr = sidstr;
>> +
>> + sprintf(strptr, "%s", "S");
>> + strptr = sidstr + strlen(sidstr);
>> +
>> + sprintf(strptr, "-%d", sidptr->revision);
>> + strptr = sidstr + strlen(sidstr);
>> +
>> + for (i = 0; i < 6; ++i) {
>> + if (sidptr->authority[i]) {
>> + sprintf(strptr, "-%d", sidptr->authority[i]);
>> + strptr = sidstr + strlen(sidstr);
>> + }
>> + }
>> +
>> + for (i = 0; i < sidptr->num_subauth; ++i) {
>> + saval = le32_to_cpu(sidptr->sub_auth[i]);
>> + sprintf(strptr, "-%ld", saval);
>> + strptr = sidstr + strlen(sidstr);
>> + }
>> +}
>> +
>> +static int
>> +cifs_sid_pending_wait(void *unused)
>> +{
>> + schedule();
>> + return signal_pending(current) ? -ERESTARTSYS : 0;
>> +}
>> +
>> +static int
>> +sid_to_id(struct cifs_sb_info *cifs_sb, struct cifs_sid *psid,
>> + struct cifs_fattr *fattr, uint sidtype)
>> +{
>> + int rc;
>> + unsigned long id;
>> + bool sidmap = true;
>> + char *strptr;
>> + char *sidstr;
>> + struct key *idkey;
>> + const struct cred *saved_cred;
>> + struct cifs_sid_id *psidid = NULL;
>> + struct cifs_sid_id *epsidid = NULL;
>> +
>> + if (sidtype != SIDOWNER && sidtype != SIDGROUP)
>> + return -ENOENT;
>> +
>> + if (sidtype == SIDOWNER) {
>> + id = cifs_sb->mnt_uid;
>> + spin_lock(&siduidlock);
>> + psidid = id_rb_search(&uidtree, psid, &sidmap);
>> + spin_unlock(&siduidlock);
>> + } else {
>> + id = cifs_sb->mnt_gid;
>> + spin_lock(&sidgidlock);
>> + psidid = id_rb_search(&gidtree, psid, &sidmap);
>> + spin_unlock(&sidgidlock);
>> + }
>> +
>> + if (!psidid) { /* node does not exist, allocate one & attempt adding */
>> + epsidid = kzalloc(sizeof(struct cifs_sid_id), GFP_KERNEL);
>> + if (!epsidid)
>> + return -ENOMEM;
>> +
>> + if (sidtype == SIDOWNER) {
>> + spin_lock(&siduidlock);
>> + psidid = id_rb_add(&uidtree, psid, &sidmap, &epsidid);
>> + spin_unlock(&siduidlock);
>> + } else {
>> + spin_lock(&sidgidlock);
>> + psidid = id_rb_add(&gidtree, psid, &sidmap, &epsidid);
>> + spin_unlock(&sidgidlock);
>> + }
>> +
>> + if (psidid) /* node happened to get added meanwhile */
>> + kfree(epsidid);
>> + else
>> + psidid = epsidid;
>> + }
>> +
>> + if (sidmap == false) { /* node with unmapped SID */
>> + sidstr = kzalloc(SIDLEN, GFP_KERNEL);
>> + if (!sidstr)
>> + rc = -ENOMEM;
>> +
> ^^^^^^^^^^^^
> Why do two allocations for this? The SIDLEN is fixed, so why not just
> allocate the sidstr as part of the cifs_sid_id struct? kmalloc is a
> power-of-two allocator so you'll end up with more wasted memory this
> way. If you really expect to have a lot of these, you might even
> consider making your own slabcache for them to make sure they get
> packed efficiently.
>
OK, will make the change. We do not need to store it now but when we
need to map uid/gid to SID, we could use this structure field.
>> + if (sidtype == SIDOWNER)
>> + sprintf(sidstr, "%s", "os:");
>> + else
>> + sprintf(sidstr, "%s", "gs:");
>> +
> ^^^^^^
> If the sidstr allocation fails, then this will go boom.
yes, I think I had a return here before but missed it during this patch.
Will take care of htis.
>
>> + strptr = sidstr + strlen(sidstr);
>> + sid_to_str(psid, strptr);
>> +
>> + saved_cred = override_creds(root_cred);
>> + idkey = request_key(&cifs_idmap_key_type, sidstr, "");
>> + if (IS_ERR(idkey))
>> + cFYI(1, "%s: Can't map SID to an id", __func__);
>> + else {
>> + id = *(unsigned long *)idkey->payload.value;
>> + key_put(idkey);
>> + clear_bit(SID_ID_UNMAPPED, &psidid->state);
>> + }
>> + psidid->time = jiffies;
>> + psidid->retry = jiffies;
>> + psidid->id = id;
>> + clear_bit(SID_ID_PENDING, &psidid->state);
> ^^^^^^^^^^^
> Yes, you're correct. You do need a wake_up_bit call.
>
>> + revert_creds(saved_cred);
>> + kfree(sidstr);
>> + } else {
>> + /*
>> + * either an existing node with SID mapped (in which case
>> + * we would not wait) or a node whose SID is being mapped
>> + * by somebody else (in which case, we would end up waiting).
>> + */
>> + rc = wait_on_bit(&psidid->state, SID_ID_PENDING,
>> + cifs_sid_pending_wait, TASK_INTERRUPTIBLE);
>> + if (rc) {
>> + cERROR(1, "%s: cifs_sid_pending_wait interrupted %d",
>> + __func__, rc);
>
> ^^^^^^^^^^
> I don't think this deserves a cERROR as this
> might happen normally if the process is
> signalled. cFYI is probably reasonable.
OK, will change to debug level instead of error level printk.
>
>> + return rc;
>> + }
>> +
>> + /*
>> + * No point in checking whether state has bit SID_ID_UNMAPPED
>> + * set. If SID_ID_UNMAPPED state bit is not set, upcall must
>> + * have returned an error. No point in making an upcall here
>> + * again right away, it is likely to fail.
>> + */
>> + id = psidid->id;
> ^^^^^^^
> So, if the upcall fails, you'll map the id to root? Is that
> intended behavior? Maybe you should be returning an
> error of some sort instead, or perhaps mapping to
> "nobody" or something would make more sense?
No, the default is mntt_uid/mnt_gid but the prefered order is
mapped uid/gid, nobody/nogroup, mnt_uid/mnt_gid
It is never root.
>> + }
>> +
>> + if (sidtype == SIDOWNER)
>> + fattr->cf_uid = id;
>> + else
>> + fattr->cf_gid = id;
>> +
>> + return 0;
>> +}
>> +
>> int
>> init_cifs_idmap(void)
>> {
>> @@ -242,16 +494,24 @@ int compare_sids(const struct cifs_sid *ctsid, const
>> struct cifs_sid *cwsid)
>> int num_subauth, num_sat, num_saw;
>>
>> if ((!ctsid) || (!cwsid))
>> - return 0;
>> + return 1;
>>
>> /* compare the revision */
>> - if (ctsid->revision != cwsid->revision)
>> - return 0;
>> + if (ctsid->revision != cwsid->revision) {
>> + if (ctsid->revision > cwsid->revision)
>> + return 1;
>> + else
>> + return -1;
>> + }
>>
>> /* compare all of the six auth values */
>> for (i = 0; i < 6; ++i) {
>> - if (ctsid->authority[i] != cwsid->authority[i])
>> - return 0;
>> + if (ctsid->authority[i] != cwsid->authority[i]) {
>> + if (ctsid->authority[i] > cwsid->authority[i])
>> + return 1;
>> + else
>> + return -1;
>> + }
>> }
>>
>> /* compare all of the subauth values if any */
>> @@ -260,12 +520,16 @@ int compare_sids(const struct cifs_sid *ctsid, const
>> struct cifs_sid *cwsid)
>> num_subauth = num_sat < num_saw ? num_sat : num_saw;
>> if (num_subauth) {
>> for (i = 0; i < num_subauth; ++i) {
>> - if (ctsid->sub_auth[i] != cwsid->sub_auth[i])
>> - return 0;
>> + if (ctsid->sub_auth[i] != cwsid->sub_auth[i]) {
>> + if (ctsid->sub_auth[i] > cwsid->sub_auth[i])
>> + return 1;
>> + else
>> + return -1;
>> + }
>> }
>> }
>>
>> - return 1; /* sids compare/match */
>> + return 0; /* sids compare/match */
>> }
>>
>>
>> @@ -520,22 +784,22 @@ static void parse_dacl(struct cifs_acl *pdacl, char
>> *end_of_acl,
>> #ifdef CONFIG_CIFS_DEBUG2
>> dump_ace(ppace[i], end_of_acl);
>> #endif
>> - if (compare_sids(&(ppace[i]->sid), pownersid))
>> + if (compare_sids(&(ppace[i]->sid), pownersid) == 0)
>> access_flags_to_mode(ppace[i]->access_req,
>> ppace[i]->type,
>> &fattr->cf_mode,
>> &user_mask);
>> - if (compare_sids(&(ppace[i]->sid), pgrpsid))
>> + if (compare_sids(&(ppace[i]->sid), pgrpsid) == 0)
>> access_flags_to_mode(ppace[i]->access_req,
>> ppace[i]->type,
>> &fattr->cf_mode,
>> &group_mask);
>> - if (compare_sids(&(ppace[i]->sid), &sid_everyone))
>> + if (compare_sids(&(ppace[i]->sid), &sid_everyone) == 0)
>> access_flags_to_mode(ppace[i]->access_req,
>> ppace[i]->type,
>> &fattr->cf_mode,
>> &other_mask);
>> - if (compare_sids(&(ppace[i]->sid), &sid_authusers))
>> + if (compare_sids(&(ppace[i]->sid), &sid_authusers) ==
>> 0)
>> access_flags_to_mode(ppace[i]->access_req,
>> ppace[i]->type,
>> &fattr->cf_mode,
>> @@ -613,10 +877,10 @@ static int parse_sid(struct cifs_sid *psid, char
>> *end_of_acl)
>>
>>
>> /* Convert CIFS ACL to POSIX form */
>> -static int parse_sec_desc(struct cifs_ntsd *pntsd, int acl_len,
>> - struct cifs_fattr *fattr)
>> +static int parse_sec_desc(struct cifs_sb_info *cifs_sb,
>> + struct cifs_ntsd *pntsd, int acl_len, struct cifs_fattr *fattr)
>> {
>> - int rc;
>> + int rc = 0;
>> struct cifs_sid *owner_sid_ptr, *group_sid_ptr;
>> struct cifs_acl *dacl_ptr; /* no need for SACL ptr */
>> char *end_of_acl = ((char *)pntsd) + acl_len;
>> @@ -638,12 +902,26 @@ static int parse_sec_desc(struct cifs_ntsd *pntsd, int
>> acl_len,
>> le32_to_cpu(pntsd->sacloffset), dacloffset);
>> /* cifs_dump_mem("owner_sid: ", owner_sid_ptr, 64); */
>> rc = parse_sid(owner_sid_ptr, end_of_acl);
>> - if (rc)
>> + if (rc) {
>> + cFYI(1, "%s: Error %d parsing Owner SID", __func__, rc);
>> return rc;
>> + }
>> + rc = sid_to_id(cifs_sb, owner_sid_ptr, fattr, SIDOWNER);
>> + if (rc) {
>> + cFYI(1, "%s: Error %d mapping Owner SID to uid", __func__, rc);
>> + return rc;
>> + }
>>
>> rc = parse_sid(group_sid_ptr, end_of_acl);
>> - if (rc)
>> + if (rc) {
>> + cFYI(1, "%s: Error %d mapping Owner SID to gid", __func__, rc);
>> return rc;
>> + }
>> + rc = sid_to_id(cifs_sb, group_sid_ptr, fattr, SIDGROUP);
>> + if (rc) {
>> + cFYI(1, "%s: Error %d mapping Group SID to gid", __func__, rc);
>> + return rc;
>> + }
>>
>> if (dacloffset)
>> parse_dacl(dacl_ptr, end_of_acl, owner_sid_ptr,
>> @@ -658,7 +936,7 @@ static int parse_sec_desc(struct cifs_ntsd *pntsd, int
>> acl_len,
>> memcpy((void *)(&(cifscred->gsid)), (void *)group_sid_ptr,
>> sizeof(struct cifs_sid)); */
>>
>> - return 0;
>> + return rc;
>> }
>>
>>
>> @@ -865,7 +1143,7 @@ cifs_acl_to_fattr(struct cifs_sb_info *cifs_sb, struct
>> cifs_fattr *fattr,
>> rc = PTR_ERR(pntsd);
>> cERROR(1, "%s: error %d getting sec desc", __func__, rc);
>> } else {
>> - rc = parse_sec_desc(pntsd, acllen, fattr);
>> + rc = parse_sec_desc(cifs_sb, pntsd, acllen, fattr);
>> kfree(pntsd);
>> if (rc)
>> cERROR(1, "parse sec desc failed rc = %d", rc);
>> diff --git a/fs/cifs/cifsacl.h b/fs/cifs/cifsacl.h
>> index 025e943..5f075c0 100644
>> --- a/fs/cifs/cifsacl.h
>> +++ b/fs/cifs/cifsacl.h
>> @@ -39,6 +39,15 @@
>> #define ACCESS_ALLOWED 0
>> #define ACCESS_DENIED 1
>>
>> +#define SIDOWNER 1
>> +#define SIDGROUP 2
>> +#define SIDLEN 150 /* S- 1 revision- 6 authorities- max 5 sub authorities */
>> +
>> +#define SID_ID_PENDING 0
>> +#define SID_ID_UNMAPPED 1
>> +#define SID_MAP_EXPIRE 1000 /* enough for an upcall to return? */
>> +#define SID_MAP_RETRY 100 /* retry mapping in case prior attempt failed */
>> +
>> struct cifs_ntsd {
>> __le16 revision; /* revision level */
>> __le16 type;
>> @@ -74,6 +83,20 @@ struct cifs_wksid {
>> char sidname[SIDNAMELENGTH];
>> } __attribute__((packed));
>>
>> +struct cifs_sid_id {
>> + struct rb_node rbnode;
>> + struct cifs_sid sid;
>> + unsigned long state;
>> + unsigned long id;
>> + unsigned long time;
>> + unsigned long retry;
>> +};
>> +
>> +#ifdef __KERNEL__
>> +extern struct key_type cifs_idmap_key_type;
>> +extern const struct cred *root_cred;
>> +#endif /* KERNEL */
>> +
>> extern int match_sid(struct cifs_sid *);
>> extern int compare_sids(const struct cifs_sid *, const struct cifs_sid *);
>>
>
>
> --
> Jeff Layton <[email protected]>
>
--
To unsubscribe from this list: send the line "unsubscribe linux-cifs" in
the body of a message to [email protected]
More majordomo info at http://vger.kernel.org/majordomo-info.html