diff options
author | J. Bruce Fields <bfields@citi.umich.edu> | 2010-03-09 17:22:08 -0500 |
---|---|---|
committer | J. Bruce Fields <bfields@citi.umich.edu> | 2010-03-09 17:22:08 -0500 |
commit | e739cf1da48e841bc5d744a99764c1a668b4bdd2 (patch) | |
tree | 1d39318bbbcdd66ad8cd34823ad9befb7af08b1f /fs/namei.c | |
parent | e7b184f199fd3c80b618ec8244cbda70857d2779 (diff) | |
parent | 57d54889cd00db2752994b389ba714138652e60c (diff) |
Merge commit 'v2.6.34-rc1' into for-2.6.35-incoming
Diffstat (limited to 'fs/namei.c')
-rw-r--r-- | fs/namei.c | 571 |
1 files changed, 274 insertions, 297 deletions
diff --git a/fs/namei.c b/fs/namei.c index a4855af776a8..48e60a187325 100644 --- a/fs/namei.c +++ b/fs/namei.c | |||
@@ -19,7 +19,6 @@ | |||
19 | #include <linux/slab.h> | 19 | #include <linux/slab.h> |
20 | #include <linux/fs.h> | 20 | #include <linux/fs.h> |
21 | #include <linux/namei.h> | 21 | #include <linux/namei.h> |
22 | #include <linux/quotaops.h> | ||
23 | #include <linux/pagemap.h> | 22 | #include <linux/pagemap.h> |
24 | #include <linux/fsnotify.h> | 23 | #include <linux/fsnotify.h> |
25 | #include <linux/personality.h> | 24 | #include <linux/personality.h> |
@@ -498,8 +497,6 @@ static int link_path_walk(const char *, struct nameidata *); | |||
498 | 497 | ||
499 | static __always_inline int __vfs_follow_link(struct nameidata *nd, const char *link) | 498 | static __always_inline int __vfs_follow_link(struct nameidata *nd, const char *link) |
500 | { | 499 | { |
501 | int res = 0; | ||
502 | char *name; | ||
503 | if (IS_ERR(link)) | 500 | if (IS_ERR(link)) |
504 | goto fail; | 501 | goto fail; |
505 | 502 | ||
@@ -510,22 +507,7 @@ static __always_inline int __vfs_follow_link(struct nameidata *nd, const char *l | |||
510 | path_get(&nd->root); | 507 | path_get(&nd->root); |
511 | } | 508 | } |
512 | 509 | ||
513 | res = link_path_walk(link, nd); | 510 | return link_path_walk(link, nd); |
514 | if (nd->depth || res || nd->last_type!=LAST_NORM) | ||
515 | return res; | ||
516 | /* | ||
517 | * If it is an iterative symlinks resolution in open_namei() we | ||
518 | * have to copy the last component. And all that crap because of | ||
519 | * bloody create() on broken symlinks. Furrfu... | ||
520 | */ | ||
521 | name = __getname(); | ||
522 | if (unlikely(!name)) { | ||
523 | path_put(&nd->path); | ||
524 | return -ENOMEM; | ||
525 | } | ||
526 | strcpy(name, nd->last.name); | ||
527 | nd->last.name = name; | ||
528 | return 0; | ||
529 | fail: | 511 | fail: |
530 | path_put(&nd->path); | 512 | path_put(&nd->path); |
531 | return PTR_ERR(link); | 513 | return PTR_ERR(link); |
@@ -547,10 +529,10 @@ static inline void path_to_nameidata(struct path *path, struct nameidata *nd) | |||
547 | nd->path.dentry = path->dentry; | 529 | nd->path.dentry = path->dentry; |
548 | } | 530 | } |
549 | 531 | ||
550 | static __always_inline int __do_follow_link(struct path *path, struct nameidata *nd) | 532 | static __always_inline int |
533 | __do_follow_link(struct path *path, struct nameidata *nd, void **p) | ||
551 | { | 534 | { |
552 | int error; | 535 | int error; |
553 | void *cookie; | ||
554 | struct dentry *dentry = path->dentry; | 536 | struct dentry *dentry = path->dentry; |
555 | 537 | ||
556 | touch_atime(path->mnt, dentry); | 538 | touch_atime(path->mnt, dentry); |
@@ -562,9 +544,9 @@ static __always_inline int __do_follow_link(struct path *path, struct nameidata | |||
562 | } | 544 | } |
563 | mntget(path->mnt); | 545 | mntget(path->mnt); |
564 | nd->last_type = LAST_BIND; | 546 | nd->last_type = LAST_BIND; |
565 | cookie = dentry->d_inode->i_op->follow_link(dentry, nd); | 547 | *p = dentry->d_inode->i_op->follow_link(dentry, nd); |
566 | error = PTR_ERR(cookie); | 548 | error = PTR_ERR(*p); |
567 | if (!IS_ERR(cookie)) { | 549 | if (!IS_ERR(*p)) { |
568 | char *s = nd_get_link(nd); | 550 | char *s = nd_get_link(nd); |
569 | error = 0; | 551 | error = 0; |
570 | if (s) | 552 | if (s) |
@@ -574,8 +556,6 @@ static __always_inline int __do_follow_link(struct path *path, struct nameidata | |||
574 | if (error) | 556 | if (error) |
575 | path_put(&nd->path); | 557 | path_put(&nd->path); |
576 | } | 558 | } |
577 | if (dentry->d_inode->i_op->put_link) | ||
578 | dentry->d_inode->i_op->put_link(dentry, nd, cookie); | ||
579 | } | 559 | } |
580 | return error; | 560 | return error; |
581 | } | 561 | } |
@@ -589,6 +569,7 @@ static __always_inline int __do_follow_link(struct path *path, struct nameidata | |||
589 | */ | 569 | */ |
590 | static inline int do_follow_link(struct path *path, struct nameidata *nd) | 570 | static inline int do_follow_link(struct path *path, struct nameidata *nd) |
591 | { | 571 | { |
572 | void *cookie; | ||
592 | int err = -ELOOP; | 573 | int err = -ELOOP; |
593 | if (current->link_count >= MAX_NESTED_LINKS) | 574 | if (current->link_count >= MAX_NESTED_LINKS) |
594 | goto loop; | 575 | goto loop; |
@@ -602,7 +583,9 @@ static inline int do_follow_link(struct path *path, struct nameidata *nd) | |||
602 | current->link_count++; | 583 | current->link_count++; |
603 | current->total_link_count++; | 584 | current->total_link_count++; |
604 | nd->depth++; | 585 | nd->depth++; |
605 | err = __do_follow_link(path, nd); | 586 | err = __do_follow_link(path, nd, &cookie); |
587 | if (!IS_ERR(cookie) && path->dentry->d_inode->i_op->put_link) | ||
588 | path->dentry->d_inode->i_op->put_link(path->dentry, nd, cookie); | ||
606 | path_put(path); | 589 | path_put(path); |
607 | current->link_count--; | 590 | current->link_count--; |
608 | nd->depth--; | 591 | nd->depth--; |
@@ -689,33 +672,20 @@ static __always_inline void follow_dotdot(struct nameidata *nd) | |||
689 | set_root(nd); | 672 | set_root(nd); |
690 | 673 | ||
691 | while(1) { | 674 | while(1) { |
692 | struct vfsmount *parent; | ||
693 | struct dentry *old = nd->path.dentry; | 675 | struct dentry *old = nd->path.dentry; |
694 | 676 | ||
695 | if (nd->path.dentry == nd->root.dentry && | 677 | if (nd->path.dentry == nd->root.dentry && |
696 | nd->path.mnt == nd->root.mnt) { | 678 | nd->path.mnt == nd->root.mnt) { |
697 | break; | 679 | break; |
698 | } | 680 | } |
699 | spin_lock(&dcache_lock); | ||
700 | if (nd->path.dentry != nd->path.mnt->mnt_root) { | 681 | if (nd->path.dentry != nd->path.mnt->mnt_root) { |
701 | nd->path.dentry = dget(nd->path.dentry->d_parent); | 682 | /* rare case of legitimate dget_parent()... */ |
702 | spin_unlock(&dcache_lock); | 683 | nd->path.dentry = dget_parent(nd->path.dentry); |
703 | dput(old); | 684 | dput(old); |
704 | break; | 685 | break; |
705 | } | 686 | } |
706 | spin_unlock(&dcache_lock); | 687 | if (!follow_up(&nd->path)) |
707 | spin_lock(&vfsmount_lock); | ||
708 | parent = nd->path.mnt->mnt_parent; | ||
709 | if (parent == nd->path.mnt) { | ||
710 | spin_unlock(&vfsmount_lock); | ||
711 | break; | 688 | break; |
712 | } | ||
713 | mntget(parent); | ||
714 | nd->path.dentry = dget(nd->path.mnt->mnt_mountpoint); | ||
715 | spin_unlock(&vfsmount_lock); | ||
716 | dput(old); | ||
717 | mntput(nd->path.mnt); | ||
718 | nd->path.mnt = parent; | ||
719 | } | 689 | } |
720 | follow_mount(&nd->path); | 690 | follow_mount(&nd->path); |
721 | } | 691 | } |
@@ -1347,7 +1317,7 @@ static int may_delete(struct inode *dir,struct dentry *victim,int isdir) | |||
1347 | return -ENOENT; | 1317 | return -ENOENT; |
1348 | 1318 | ||
1349 | BUG_ON(victim->d_parent->d_inode != dir); | 1319 | BUG_ON(victim->d_parent->d_inode != dir); |
1350 | audit_inode_child(victim->d_name.name, victim, dir); | 1320 | audit_inode_child(victim, dir); |
1351 | 1321 | ||
1352 | error = inode_permission(dir, MAY_WRITE | MAY_EXEC); | 1322 | error = inode_permission(dir, MAY_WRITE | MAY_EXEC); |
1353 | if (error) | 1323 | if (error) |
@@ -1388,22 +1358,6 @@ static inline int may_create(struct inode *dir, struct dentry *child) | |||
1388 | return inode_permission(dir, MAY_WRITE | MAY_EXEC); | 1358 | return inode_permission(dir, MAY_WRITE | MAY_EXEC); |
1389 | } | 1359 | } |
1390 | 1360 | ||
1391 | /* | ||
1392 | * O_DIRECTORY translates into forcing a directory lookup. | ||
1393 | */ | ||
1394 | static inline int lookup_flags(unsigned int f) | ||
1395 | { | ||
1396 | unsigned long retval = LOOKUP_FOLLOW; | ||
1397 | |||
1398 | if (f & O_NOFOLLOW) | ||
1399 | retval &= ~LOOKUP_FOLLOW; | ||
1400 | |||
1401 | if (f & O_DIRECTORY) | ||
1402 | retval |= LOOKUP_DIRECTORY; | ||
1403 | |||
1404 | return retval; | ||
1405 | } | ||
1406 | |||
1407 | /* | 1361 | /* |
1408 | * p1 and p2 should be directories on the same fs. | 1362 | * p1 and p2 should be directories on the same fs. |
1409 | */ | 1363 | */ |
@@ -1461,7 +1415,6 @@ int vfs_create(struct inode *dir, struct dentry *dentry, int mode, | |||
1461 | error = security_inode_create(dir, dentry, mode); | 1415 | error = security_inode_create(dir, dentry, mode); |
1462 | if (error) | 1416 | if (error) |
1463 | return error; | 1417 | return error; |
1464 | vfs_dq_init(dir); | ||
1465 | error = dir->i_op->create(dir, dentry, mode, nd); | 1418 | error = dir->i_op->create(dir, dentry, mode, nd); |
1466 | if (!error) | 1419 | if (!error) |
1467 | fsnotify_create(dir, dentry); | 1420 | fsnotify_create(dir, dentry); |
@@ -1503,7 +1456,7 @@ int may_open(struct path *path, int acc_mode, int flag) | |||
1503 | * An append-only file must be opened in append mode for writing. | 1456 | * An append-only file must be opened in append mode for writing. |
1504 | */ | 1457 | */ |
1505 | if (IS_APPEND(inode)) { | 1458 | if (IS_APPEND(inode)) { |
1506 | if ((flag & FMODE_WRITE) && !(flag & O_APPEND)) | 1459 | if ((flag & O_ACCMODE) != O_RDONLY && !(flag & O_APPEND)) |
1507 | return -EPERM; | 1460 | return -EPERM; |
1508 | if (flag & O_TRUNC) | 1461 | if (flag & O_TRUNC) |
1509 | return -EPERM; | 1462 | return -EPERM; |
@@ -1547,7 +1500,7 @@ static int handle_truncate(struct path *path) | |||
1547 | * what get passed to sys_open(). | 1500 | * what get passed to sys_open(). |
1548 | */ | 1501 | */ |
1549 | static int __open_namei_create(struct nameidata *nd, struct path *path, | 1502 | static int __open_namei_create(struct nameidata *nd, struct path *path, |
1550 | int flag, int mode) | 1503 | int open_flag, int mode) |
1551 | { | 1504 | { |
1552 | int error; | 1505 | int error; |
1553 | struct dentry *dir = nd->path.dentry; | 1506 | struct dentry *dir = nd->path.dentry; |
@@ -1565,7 +1518,7 @@ out_unlock: | |||
1565 | if (error) | 1518 | if (error) |
1566 | return error; | 1519 | return error; |
1567 | /* Don't check for write permission, don't truncate */ | 1520 | /* Don't check for write permission, don't truncate */ |
1568 | return may_open(&nd->path, 0, flag & ~O_TRUNC); | 1521 | return may_open(&nd->path, 0, open_flag & ~O_TRUNC); |
1569 | } | 1522 | } |
1570 | 1523 | ||
1571 | /* | 1524 | /* |
@@ -1603,129 +1556,132 @@ static int open_will_truncate(int flag, struct inode *inode) | |||
1603 | return (flag & O_TRUNC); | 1556 | return (flag & O_TRUNC); |
1604 | } | 1557 | } |
1605 | 1558 | ||
1606 | /* | 1559 | static struct file *finish_open(struct nameidata *nd, |
1607 | * Note that the low bits of the passed in "open_flag" | 1560 | int open_flag, int acc_mode) |
1608 | * are not the same as in the local variable "flag". See | ||
1609 | * open_to_namei_flags() for more details. | ||
1610 | */ | ||
1611 | struct file *do_filp_open(int dfd, const char *pathname, | ||
1612 | int open_flag, int mode, int acc_mode) | ||
1613 | { | 1561 | { |
1614 | struct file *filp; | 1562 | struct file *filp; |
1615 | struct nameidata nd; | ||
1616 | int error; | ||
1617 | struct path path; | ||
1618 | struct dentry *dir; | ||
1619 | int count = 0; | ||
1620 | int will_truncate; | 1563 | int will_truncate; |
1621 | int flag = open_to_namei_flags(open_flag); | 1564 | int error; |
1622 | int force_reval = 0; | ||
1623 | 1565 | ||
1566 | will_truncate = open_will_truncate(open_flag, nd->path.dentry->d_inode); | ||
1567 | if (will_truncate) { | ||
1568 | error = mnt_want_write(nd->path.mnt); | ||
1569 | if (error) | ||
1570 | goto exit; | ||
1571 | } | ||
1572 | error = may_open(&nd->path, acc_mode, open_flag); | ||
1573 | if (error) { | ||
1574 | if (will_truncate) | ||
1575 | mnt_drop_write(nd->path.mnt); | ||
1576 | goto exit; | ||
1577 | } | ||
1578 | filp = nameidata_to_filp(nd); | ||
1579 | if (!IS_ERR(filp)) { | ||
1580 | error = ima_file_check(filp, acc_mode); | ||
1581 | if (error) { | ||
1582 | fput(filp); | ||
1583 | filp = ERR_PTR(error); | ||
1584 | } | ||
1585 | } | ||
1586 | if (!IS_ERR(filp)) { | ||
1587 | if (will_truncate) { | ||
1588 | error = handle_truncate(&nd->path); | ||
1589 | if (error) { | ||
1590 | fput(filp); | ||
1591 | filp = ERR_PTR(error); | ||
1592 | } | ||
1593 | } | ||
1594 | } | ||
1624 | /* | 1595 | /* |
1625 | * O_SYNC is implemented as __O_SYNC|O_DSYNC. As many places only | 1596 | * It is now safe to drop the mnt write |
1626 | * check for O_DSYNC if the need any syncing at all we enforce it's | 1597 | * because the filp has had a write taken |
1627 | * always set instead of having to deal with possibly weird behaviour | 1598 | * on its behalf. |
1628 | * for malicious applications setting only __O_SYNC. | ||
1629 | */ | 1599 | */ |
1630 | if (open_flag & __O_SYNC) | 1600 | if (will_truncate) |
1631 | open_flag |= O_DSYNC; | 1601 | mnt_drop_write(nd->path.mnt); |
1632 | 1602 | return filp; | |
1633 | if (!acc_mode) | ||
1634 | acc_mode = MAY_OPEN | ACC_MODE(open_flag); | ||
1635 | 1603 | ||
1636 | /* O_TRUNC implies we need access checks for write permissions */ | 1604 | exit: |
1637 | if (flag & O_TRUNC) | 1605 | if (!IS_ERR(nd->intent.open.file)) |
1638 | acc_mode |= MAY_WRITE; | 1606 | release_open_intent(nd); |
1607 | path_put(&nd->path); | ||
1608 | return ERR_PTR(error); | ||
1609 | } | ||
1639 | 1610 | ||
1640 | /* Allow the LSM permission hook to distinguish append | 1611 | static struct file *do_last(struct nameidata *nd, struct path *path, |
1641 | access from general write access. */ | 1612 | int open_flag, int acc_mode, |
1642 | if (flag & O_APPEND) | 1613 | int mode, const char *pathname, |
1643 | acc_mode |= MAY_APPEND; | 1614 | int *want_dir) |
1615 | { | ||
1616 | struct dentry *dir = nd->path.dentry; | ||
1617 | struct file *filp; | ||
1618 | int error = -EISDIR; | ||
1644 | 1619 | ||
1645 | /* | 1620 | switch (nd->last_type) { |
1646 | * The simplest case - just a plain lookup. | 1621 | case LAST_DOTDOT: |
1647 | */ | 1622 | follow_dotdot(nd); |
1648 | if (!(flag & O_CREAT)) { | 1623 | dir = nd->path.dentry; |
1649 | filp = get_empty_filp(); | 1624 | if (nd->path.mnt->mnt_sb->s_type->fs_flags & FS_REVAL_DOT) { |
1650 | 1625 | if (!dir->d_op->d_revalidate(dir, nd)) { | |
1651 | if (filp == NULL) | 1626 | error = -ESTALE; |
1652 | return ERR_PTR(-ENFILE); | 1627 | goto exit; |
1653 | nd.intent.open.file = filp; | ||
1654 | filp->f_flags = open_flag; | ||
1655 | nd.intent.open.flags = flag; | ||
1656 | nd.intent.open.create_mode = 0; | ||
1657 | error = do_path_lookup(dfd, pathname, | ||
1658 | lookup_flags(flag)|LOOKUP_OPEN, &nd); | ||
1659 | if (IS_ERR(nd.intent.open.file)) { | ||
1660 | if (error == 0) { | ||
1661 | error = PTR_ERR(nd.intent.open.file); | ||
1662 | path_put(&nd.path); | ||
1663 | } | 1628 | } |
1664 | } else if (error) | 1629 | } |
1665 | release_open_intent(&nd); | 1630 | /* fallthrough */ |
1666 | if (error) | 1631 | case LAST_DOT: |
1667 | return ERR_PTR(error); | 1632 | case LAST_ROOT: |
1633 | if (open_flag & O_CREAT) | ||
1634 | goto exit; | ||
1635 | /* fallthrough */ | ||
1636 | case LAST_BIND: | ||
1637 | audit_inode(pathname, dir); | ||
1668 | goto ok; | 1638 | goto ok; |
1669 | } | 1639 | } |
1670 | 1640 | ||
1671 | /* | 1641 | /* trailing slashes? */ |
1672 | * Create - we need to know the parent. | 1642 | if (nd->last.name[nd->last.len]) { |
1673 | */ | 1643 | if (open_flag & O_CREAT) |
1674 | reval: | 1644 | goto exit; |
1675 | error = path_init(dfd, pathname, LOOKUP_PARENT, &nd); | 1645 | *want_dir = 1; |
1676 | if (error) | ||
1677 | return ERR_PTR(error); | ||
1678 | if (force_reval) | ||
1679 | nd.flags |= LOOKUP_REVAL; | ||
1680 | error = path_walk(pathname, &nd); | ||
1681 | if (error) { | ||
1682 | if (nd.root.mnt) | ||
1683 | path_put(&nd.root); | ||
1684 | return ERR_PTR(error); | ||
1685 | } | 1646 | } |
1686 | if (unlikely(!audit_dummy_context())) | ||
1687 | audit_inode(pathname, nd.path.dentry); | ||
1688 | 1647 | ||
1689 | /* | 1648 | /* just plain open? */ |
1690 | * We have the parent and last component. First of all, check | 1649 | if (!(open_flag & O_CREAT)) { |
1691 | * that we are not asked to creat(2) an obvious directory - that | 1650 | error = do_lookup(nd, &nd->last, path); |
1692 | * will not do. | 1651 | if (error) |
1693 | */ | 1652 | goto exit; |
1694 | error = -EISDIR; | 1653 | error = -ENOENT; |
1695 | if (nd.last_type != LAST_NORM || nd.last.name[nd.last.len]) | 1654 | if (!path->dentry->d_inode) |
1696 | goto exit_parent; | 1655 | goto exit_dput; |
1656 | if (path->dentry->d_inode->i_op->follow_link) | ||
1657 | return NULL; | ||
1658 | error = -ENOTDIR; | ||
1659 | if (*want_dir && !path->dentry->d_inode->i_op->lookup) | ||
1660 | goto exit_dput; | ||
1661 | path_to_nameidata(path, nd); | ||
1662 | audit_inode(pathname, nd->path.dentry); | ||
1663 | goto ok; | ||
1664 | } | ||
1697 | 1665 | ||
1698 | error = -ENFILE; | 1666 | /* OK, it's O_CREAT */ |
1699 | filp = get_empty_filp(); | ||
1700 | if (filp == NULL) | ||
1701 | goto exit_parent; | ||
1702 | nd.intent.open.file = filp; | ||
1703 | filp->f_flags = open_flag; | ||
1704 | nd.intent.open.flags = flag; | ||
1705 | nd.intent.open.create_mode = mode; | ||
1706 | dir = nd.path.dentry; | ||
1707 | nd.flags &= ~LOOKUP_PARENT; | ||
1708 | nd.flags |= LOOKUP_CREATE | LOOKUP_OPEN; | ||
1709 | if (flag & O_EXCL) | ||
1710 | nd.flags |= LOOKUP_EXCL; | ||
1711 | mutex_lock(&dir->d_inode->i_mutex); | 1667 | mutex_lock(&dir->d_inode->i_mutex); |
1712 | path.dentry = lookup_hash(&nd); | ||
1713 | path.mnt = nd.path.mnt; | ||
1714 | 1668 | ||
1715 | do_last: | 1669 | path->dentry = lookup_hash(nd); |
1716 | error = PTR_ERR(path.dentry); | 1670 | path->mnt = nd->path.mnt; |
1717 | if (IS_ERR(path.dentry)) { | 1671 | |
1672 | error = PTR_ERR(path->dentry); | ||
1673 | if (IS_ERR(path->dentry)) { | ||
1718 | mutex_unlock(&dir->d_inode->i_mutex); | 1674 | mutex_unlock(&dir->d_inode->i_mutex); |
1719 | goto exit; | 1675 | goto exit; |
1720 | } | 1676 | } |
1721 | 1677 | ||
1722 | if (IS_ERR(nd.intent.open.file)) { | 1678 | if (IS_ERR(nd->intent.open.file)) { |
1723 | error = PTR_ERR(nd.intent.open.file); | 1679 | error = PTR_ERR(nd->intent.open.file); |
1724 | goto exit_mutex_unlock; | 1680 | goto exit_mutex_unlock; |
1725 | } | 1681 | } |
1726 | 1682 | ||
1727 | /* Negative dentry, just create the file */ | 1683 | /* Negative dentry, just create the file */ |
1728 | if (!path.dentry->d_inode) { | 1684 | if (!path->dentry->d_inode) { |
1729 | /* | 1685 | /* |
1730 | * This write is needed to ensure that a | 1686 | * This write is needed to ensure that a |
1731 | * ro->rw transition does not occur between | 1687 | * ro->rw transition does not occur between |
@@ -1733,18 +1689,16 @@ do_last: | |||
1733 | * a permanent write count is taken through | 1689 | * a permanent write count is taken through |
1734 | * the 'struct file' in nameidata_to_filp(). | 1690 | * the 'struct file' in nameidata_to_filp(). |
1735 | */ | 1691 | */ |
1736 | error = mnt_want_write(nd.path.mnt); | 1692 | error = mnt_want_write(nd->path.mnt); |
1737 | if (error) | 1693 | if (error) |
1738 | goto exit_mutex_unlock; | 1694 | goto exit_mutex_unlock; |
1739 | error = __open_namei_create(&nd, &path, flag, mode); | 1695 | error = __open_namei_create(nd, path, open_flag, mode); |
1740 | if (error) { | 1696 | if (error) { |
1741 | mnt_drop_write(nd.path.mnt); | 1697 | mnt_drop_write(nd->path.mnt); |
1742 | goto exit; | 1698 | goto exit; |
1743 | } | 1699 | } |
1744 | filp = nameidata_to_filp(&nd); | 1700 | filp = nameidata_to_filp(nd); |
1745 | mnt_drop_write(nd.path.mnt); | 1701 | mnt_drop_write(nd->path.mnt); |
1746 | if (nd.root.mnt) | ||
1747 | path_put(&nd.root); | ||
1748 | if (!IS_ERR(filp)) { | 1702 | if (!IS_ERR(filp)) { |
1749 | error = ima_file_check(filp, acc_mode); | 1703 | error = ima_file_check(filp, acc_mode); |
1750 | if (error) { | 1704 | if (error) { |
@@ -1759,150 +1713,181 @@ do_last: | |||
1759 | * It already exists. | 1713 | * It already exists. |
1760 | */ | 1714 | */ |
1761 | mutex_unlock(&dir->d_inode->i_mutex); | 1715 | mutex_unlock(&dir->d_inode->i_mutex); |
1762 | audit_inode(pathname, path.dentry); | 1716 | audit_inode(pathname, path->dentry); |
1763 | 1717 | ||
1764 | error = -EEXIST; | 1718 | error = -EEXIST; |
1765 | if (flag & O_EXCL) | 1719 | if (open_flag & O_EXCL) |
1766 | goto exit_dput; | 1720 | goto exit_dput; |
1767 | 1721 | ||
1768 | if (__follow_mount(&path)) { | 1722 | if (__follow_mount(path)) { |
1769 | error = -ELOOP; | 1723 | error = -ELOOP; |
1770 | if (flag & O_NOFOLLOW) | 1724 | if (open_flag & O_NOFOLLOW) |
1771 | goto exit_dput; | 1725 | goto exit_dput; |
1772 | } | 1726 | } |
1773 | 1727 | ||
1774 | error = -ENOENT; | 1728 | error = -ENOENT; |
1775 | if (!path.dentry->d_inode) | 1729 | if (!path->dentry->d_inode) |
1776 | goto exit_dput; | 1730 | goto exit_dput; |
1777 | if (path.dentry->d_inode->i_op->follow_link) | ||
1778 | goto do_link; | ||
1779 | 1731 | ||
1780 | path_to_nameidata(&path, &nd); | 1732 | if (path->dentry->d_inode->i_op->follow_link) |
1733 | return NULL; | ||
1734 | |||
1735 | path_to_nameidata(path, nd); | ||
1781 | error = -EISDIR; | 1736 | error = -EISDIR; |
1782 | if (S_ISDIR(path.dentry->d_inode->i_mode)) | 1737 | if (S_ISDIR(path->dentry->d_inode->i_mode)) |
1783 | goto exit; | 1738 | goto exit; |
1784 | ok: | 1739 | ok: |
1740 | filp = finish_open(nd, open_flag, acc_mode); | ||
1741 | return filp; | ||
1742 | |||
1743 | exit_mutex_unlock: | ||
1744 | mutex_unlock(&dir->d_inode->i_mutex); | ||
1745 | exit_dput: | ||
1746 | path_put_conditional(path, nd); | ||
1747 | exit: | ||
1748 | if (!IS_ERR(nd->intent.open.file)) | ||
1749 | release_open_intent(nd); | ||
1750 | path_put(&nd->path); | ||
1751 | return ERR_PTR(error); | ||
1752 | } | ||
1753 | |||
1754 | /* | ||
1755 | * Note that the low bits of the passed in "open_flag" | ||
1756 | * are not the same as in the local variable "flag". See | ||
1757 | * open_to_namei_flags() for more details. | ||
1758 | */ | ||
1759 | struct file *do_filp_open(int dfd, const char *pathname, | ||
1760 | int open_flag, int mode, int acc_mode) | ||
1761 | { | ||
1762 | struct file *filp; | ||
1763 | struct nameidata nd; | ||
1764 | int error; | ||
1765 | struct path path; | ||
1766 | int count = 0; | ||
1767 | int flag = open_to_namei_flags(open_flag); | ||
1768 | int force_reval = 0; | ||
1769 | int want_dir = open_flag & O_DIRECTORY; | ||
1770 | |||
1771 | if (!(open_flag & O_CREAT)) | ||
1772 | mode = 0; | ||
1773 | |||
1785 | /* | 1774 | /* |
1786 | * Consider: | 1775 | * O_SYNC is implemented as __O_SYNC|O_DSYNC. As many places only |
1787 | * 1. may_open() truncates a file | 1776 | * check for O_DSYNC if the need any syncing at all we enforce it's |
1788 | * 2. a rw->ro mount transition occurs | 1777 | * always set instead of having to deal with possibly weird behaviour |
1789 | * 3. nameidata_to_filp() fails due to | 1778 | * for malicious applications setting only __O_SYNC. |
1790 | * the ro mount. | ||
1791 | * That would be inconsistent, and should | ||
1792 | * be avoided. Taking this mnt write here | ||
1793 | * ensures that (2) can not occur. | ||
1794 | */ | 1779 | */ |
1795 | will_truncate = open_will_truncate(flag, nd.path.dentry->d_inode); | 1780 | if (open_flag & __O_SYNC) |
1796 | if (will_truncate) { | 1781 | open_flag |= O_DSYNC; |
1797 | error = mnt_want_write(nd.path.mnt); | 1782 | |
1798 | if (error) | 1783 | if (!acc_mode) |
1799 | goto exit; | 1784 | acc_mode = MAY_OPEN | ACC_MODE(open_flag); |
1800 | } | 1785 | |
1801 | error = may_open(&nd.path, acc_mode, flag); | 1786 | /* O_TRUNC implies we need access checks for write permissions */ |
1787 | if (open_flag & O_TRUNC) | ||
1788 | acc_mode |= MAY_WRITE; | ||
1789 | |||
1790 | /* Allow the LSM permission hook to distinguish append | ||
1791 | access from general write access. */ | ||
1792 | if (open_flag & O_APPEND) | ||
1793 | acc_mode |= MAY_APPEND; | ||
1794 | |||
1795 | /* find the parent */ | ||
1796 | reval: | ||
1797 | error = path_init(dfd, pathname, LOOKUP_PARENT, &nd); | ||
1798 | if (error) | ||
1799 | return ERR_PTR(error); | ||
1800 | if (force_reval) | ||
1801 | nd.flags |= LOOKUP_REVAL; | ||
1802 | |||
1803 | current->total_link_count = 0; | ||
1804 | error = link_path_walk(pathname, &nd); | ||
1802 | if (error) { | 1805 | if (error) { |
1803 | if (will_truncate) | 1806 | filp = ERR_PTR(error); |
1804 | mnt_drop_write(nd.path.mnt); | 1807 | goto out; |
1805 | goto exit; | ||
1806 | } | ||
1807 | filp = nameidata_to_filp(&nd); | ||
1808 | if (!IS_ERR(filp)) { | ||
1809 | error = ima_file_check(filp, acc_mode); | ||
1810 | if (error) { | ||
1811 | fput(filp); | ||
1812 | filp = ERR_PTR(error); | ||
1813 | } | ||
1814 | } | 1808 | } |
1815 | if (!IS_ERR(filp)) { | 1809 | if (unlikely(!audit_dummy_context()) && (open_flag & O_CREAT)) |
1816 | if (acc_mode & MAY_WRITE) | 1810 | audit_inode(pathname, nd.path.dentry); |
1817 | vfs_dq_init(nd.path.dentry->d_inode); | ||
1818 | 1811 | ||
1819 | if (will_truncate) { | ||
1820 | error = handle_truncate(&nd.path); | ||
1821 | if (error) { | ||
1822 | fput(filp); | ||
1823 | filp = ERR_PTR(error); | ||
1824 | } | ||
1825 | } | ||
1826 | } | ||
1827 | /* | 1812 | /* |
1828 | * It is now safe to drop the mnt write | 1813 | * We have the parent and last component. |
1829 | * because the filp has had a write taken | ||
1830 | * on its behalf. | ||
1831 | */ | 1814 | */ |
1832 | if (will_truncate) | 1815 | |
1833 | mnt_drop_write(nd.path.mnt); | 1816 | error = -ENFILE; |
1817 | filp = get_empty_filp(); | ||
1818 | if (filp == NULL) | ||
1819 | goto exit_parent; | ||
1820 | nd.intent.open.file = filp; | ||
1821 | filp->f_flags = open_flag; | ||
1822 | nd.intent.open.flags = flag; | ||
1823 | nd.intent.open.create_mode = mode; | ||
1824 | nd.flags &= ~LOOKUP_PARENT; | ||
1825 | nd.flags |= LOOKUP_OPEN; | ||
1826 | if (open_flag & O_CREAT) { | ||
1827 | nd.flags |= LOOKUP_CREATE; | ||
1828 | if (open_flag & O_EXCL) | ||
1829 | nd.flags |= LOOKUP_EXCL; | ||
1830 | } | ||
1831 | filp = do_last(&nd, &path, open_flag, acc_mode, mode, pathname, &want_dir); | ||
1832 | while (unlikely(!filp)) { /* trailing symlink */ | ||
1833 | struct path holder; | ||
1834 | struct inode *inode = path.dentry->d_inode; | ||
1835 | void *cookie; | ||
1836 | error = -ELOOP; | ||
1837 | /* S_ISDIR part is a temporary automount kludge */ | ||
1838 | if ((open_flag & O_NOFOLLOW) && !S_ISDIR(inode->i_mode)) | ||
1839 | goto exit_dput; | ||
1840 | if (count++ == 32) | ||
1841 | goto exit_dput; | ||
1842 | /* | ||
1843 | * This is subtle. Instead of calling do_follow_link() we do | ||
1844 | * the thing by hands. The reason is that this way we have zero | ||
1845 | * link_count and path_walk() (called from ->follow_link) | ||
1846 | * honoring LOOKUP_PARENT. After that we have the parent and | ||
1847 | * last component, i.e. we are in the same situation as after | ||
1848 | * the first path_walk(). Well, almost - if the last component | ||
1849 | * is normal we get its copy stored in nd->last.name and we will | ||
1850 | * have to putname() it when we are done. Procfs-like symlinks | ||
1851 | * just set LAST_BIND. | ||
1852 | */ | ||
1853 | nd.flags |= LOOKUP_PARENT; | ||
1854 | error = security_inode_follow_link(path.dentry, &nd); | ||
1855 | if (error) | ||
1856 | goto exit_dput; | ||
1857 | error = __do_follow_link(&path, &nd, &cookie); | ||
1858 | if (unlikely(error)) { | ||
1859 | /* nd.path had been dropped */ | ||
1860 | if (!IS_ERR(cookie) && inode->i_op->put_link) | ||
1861 | inode->i_op->put_link(path.dentry, &nd, cookie); | ||
1862 | path_put(&path); | ||
1863 | release_open_intent(&nd); | ||
1864 | filp = ERR_PTR(error); | ||
1865 | goto out; | ||
1866 | } | ||
1867 | holder = path; | ||
1868 | nd.flags &= ~LOOKUP_PARENT; | ||
1869 | filp = do_last(&nd, &path, open_flag, acc_mode, mode, pathname, &want_dir); | ||
1870 | if (inode->i_op->put_link) | ||
1871 | inode->i_op->put_link(holder.dentry, &nd, cookie); | ||
1872 | path_put(&holder); | ||
1873 | } | ||
1874 | out: | ||
1834 | if (nd.root.mnt) | 1875 | if (nd.root.mnt) |
1835 | path_put(&nd.root); | 1876 | path_put(&nd.root); |
1877 | if (filp == ERR_PTR(-ESTALE) && !force_reval) { | ||
1878 | force_reval = 1; | ||
1879 | goto reval; | ||
1880 | } | ||
1836 | return filp; | 1881 | return filp; |
1837 | 1882 | ||
1838 | exit_mutex_unlock: | ||
1839 | mutex_unlock(&dir->d_inode->i_mutex); | ||
1840 | exit_dput: | 1883 | exit_dput: |
1841 | path_put_conditional(&path, &nd); | 1884 | path_put_conditional(&path, &nd); |
1842 | exit: | ||
1843 | if (!IS_ERR(nd.intent.open.file)) | 1885 | if (!IS_ERR(nd.intent.open.file)) |
1844 | release_open_intent(&nd); | 1886 | release_open_intent(&nd); |
1845 | exit_parent: | 1887 | exit_parent: |
1846 | if (nd.root.mnt) | ||
1847 | path_put(&nd.root); | ||
1848 | path_put(&nd.path); | 1888 | path_put(&nd.path); |
1849 | return ERR_PTR(error); | 1889 | filp = ERR_PTR(error); |
1850 | 1890 | goto out; | |
1851 | do_link: | ||
1852 | error = -ELOOP; | ||
1853 | if (flag & O_NOFOLLOW) | ||
1854 | goto exit_dput; | ||
1855 | /* | ||
1856 | * This is subtle. Instead of calling do_follow_link() we do the | ||
1857 | * thing by hands. The reason is that this way we have zero link_count | ||
1858 | * and path_walk() (called from ->follow_link) honoring LOOKUP_PARENT. | ||
1859 | * After that we have the parent and last component, i.e. | ||
1860 | * we are in the same situation as after the first path_walk(). | ||
1861 | * Well, almost - if the last component is normal we get its copy | ||
1862 | * stored in nd->last.name and we will have to putname() it when we | ||
1863 | * are done. Procfs-like symlinks just set LAST_BIND. | ||
1864 | */ | ||
1865 | nd.flags |= LOOKUP_PARENT; | ||
1866 | error = security_inode_follow_link(path.dentry, &nd); | ||
1867 | if (error) | ||
1868 | goto exit_dput; | ||
1869 | error = __do_follow_link(&path, &nd); | ||
1870 | path_put(&path); | ||
1871 | if (error) { | ||
1872 | /* Does someone understand code flow here? Or it is only | ||
1873 | * me so stupid? Anathema to whoever designed this non-sense | ||
1874 | * with "intent.open". | ||
1875 | */ | ||
1876 | release_open_intent(&nd); | ||
1877 | if (nd.root.mnt) | ||
1878 | path_put(&nd.root); | ||
1879 | if (error == -ESTALE && !force_reval) { | ||
1880 | force_reval = 1; | ||
1881 | goto reval; | ||
1882 | } | ||
1883 | return ERR_PTR(error); | ||
1884 | } | ||
1885 | nd.flags &= ~LOOKUP_PARENT; | ||
1886 | if (nd.last_type == LAST_BIND) | ||
1887 | goto ok; | ||
1888 | error = -EISDIR; | ||
1889 | if (nd.last_type != LAST_NORM) | ||
1890 | goto exit; | ||
1891 | if (nd.last.name[nd.last.len]) { | ||
1892 | __putname(nd.last.name); | ||
1893 | goto exit; | ||
1894 | } | ||
1895 | error = -ELOOP; | ||
1896 | if (count++==32) { | ||
1897 | __putname(nd.last.name); | ||
1898 | goto exit; | ||
1899 | } | ||
1900 | dir = nd.path.dentry; | ||
1901 | mutex_lock(&dir->d_inode->i_mutex); | ||
1902 | path.dentry = lookup_hash(&nd); | ||
1903 | path.mnt = nd.path.mnt; | ||
1904 | __putname(nd.last.name); | ||
1905 | goto do_last; | ||
1906 | } | 1891 | } |
1907 | 1892 | ||
1908 | /** | 1893 | /** |
@@ -1996,7 +1981,6 @@ int vfs_mknod(struct inode *dir, struct dentry *dentry, int mode, dev_t dev) | |||
1996 | if (error) | 1981 | if (error) |
1997 | return error; | 1982 | return error; |
1998 | 1983 | ||
1999 | vfs_dq_init(dir); | ||
2000 | error = dir->i_op->mknod(dir, dentry, mode, dev); | 1984 | error = dir->i_op->mknod(dir, dentry, mode, dev); |
2001 | if (!error) | 1985 | if (!error) |
2002 | fsnotify_create(dir, dentry); | 1986 | fsnotify_create(dir, dentry); |
@@ -2095,7 +2079,6 @@ int vfs_mkdir(struct inode *dir, struct dentry *dentry, int mode) | |||
2095 | if (error) | 2079 | if (error) |
2096 | return error; | 2080 | return error; |
2097 | 2081 | ||
2098 | vfs_dq_init(dir); | ||
2099 | error = dir->i_op->mkdir(dir, dentry, mode); | 2082 | error = dir->i_op->mkdir(dir, dentry, mode); |
2100 | if (!error) | 2083 | if (!error) |
2101 | fsnotify_mkdir(dir, dentry); | 2084 | fsnotify_mkdir(dir, dentry); |
@@ -2181,8 +2164,6 @@ int vfs_rmdir(struct inode *dir, struct dentry *dentry) | |||
2181 | if (!dir->i_op->rmdir) | 2164 | if (!dir->i_op->rmdir) |
2182 | return -EPERM; | 2165 | return -EPERM; |
2183 | 2166 | ||
2184 | vfs_dq_init(dir); | ||
2185 | |||
2186 | mutex_lock(&dentry->d_inode->i_mutex); | 2167 | mutex_lock(&dentry->d_inode->i_mutex); |
2187 | dentry_unhash(dentry); | 2168 | dentry_unhash(dentry); |
2188 | if (d_mountpoint(dentry)) | 2169 | if (d_mountpoint(dentry)) |
@@ -2268,15 +2249,16 @@ int vfs_unlink(struct inode *dir, struct dentry *dentry) | |||
2268 | if (!dir->i_op->unlink) | 2249 | if (!dir->i_op->unlink) |
2269 | return -EPERM; | 2250 | return -EPERM; |
2270 | 2251 | ||
2271 | vfs_dq_init(dir); | ||
2272 | |||
2273 | mutex_lock(&dentry->d_inode->i_mutex); | 2252 | mutex_lock(&dentry->d_inode->i_mutex); |
2274 | if (d_mountpoint(dentry)) | 2253 | if (d_mountpoint(dentry)) |
2275 | error = -EBUSY; | 2254 | error = -EBUSY; |
2276 | else { | 2255 | else { |
2277 | error = security_inode_unlink(dir, dentry); | 2256 | error = security_inode_unlink(dir, dentry); |
2278 | if (!error) | 2257 | if (!error) { |
2279 | error = dir->i_op->unlink(dir, dentry); | 2258 | error = dir->i_op->unlink(dir, dentry); |
2259 | if (!error) | ||
2260 | dentry->d_inode->i_flags |= S_DEAD; | ||
2261 | } | ||
2280 | } | 2262 | } |
2281 | mutex_unlock(&dentry->d_inode->i_mutex); | 2263 | mutex_unlock(&dentry->d_inode->i_mutex); |
2282 | 2264 | ||
@@ -2379,7 +2361,6 @@ int vfs_symlink(struct inode *dir, struct dentry *dentry, const char *oldname) | |||
2379 | if (error) | 2361 | if (error) |
2380 | return error; | 2362 | return error; |
2381 | 2363 | ||
2382 | vfs_dq_init(dir); | ||
2383 | error = dir->i_op->symlink(dir, dentry, oldname); | 2364 | error = dir->i_op->symlink(dir, dentry, oldname); |
2384 | if (!error) | 2365 | if (!error) |
2385 | fsnotify_create(dir, dentry); | 2366 | fsnotify_create(dir, dentry); |
@@ -2463,7 +2444,6 @@ int vfs_link(struct dentry *old_dentry, struct inode *dir, struct dentry *new_de | |||
2463 | return error; | 2444 | return error; |
2464 | 2445 | ||
2465 | mutex_lock(&inode->i_mutex); | 2446 | mutex_lock(&inode->i_mutex); |
2466 | vfs_dq_init(dir); | ||
2467 | error = dir->i_op->link(old_dentry, dir, new_dentry); | 2447 | error = dir->i_op->link(old_dentry, dir, new_dentry); |
2468 | mutex_unlock(&inode->i_mutex); | 2448 | mutex_unlock(&inode->i_mutex); |
2469 | if (!error) | 2449 | if (!error) |
@@ -2629,6 +2609,8 @@ static int vfs_rename_other(struct inode *old_dir, struct dentry *old_dentry, | |||
2629 | else | 2609 | else |
2630 | error = old_dir->i_op->rename(old_dir, old_dentry, new_dir, new_dentry); | 2610 | error = old_dir->i_op->rename(old_dir, old_dentry, new_dir, new_dentry); |
2631 | if (!error) { | 2611 | if (!error) { |
2612 | if (target) | ||
2613 | target->i_flags |= S_DEAD; | ||
2632 | if (!(old_dir->i_sb->s_type->fs_flags & FS_RENAME_DOES_D_MOVE)) | 2614 | if (!(old_dir->i_sb->s_type->fs_flags & FS_RENAME_DOES_D_MOVE)) |
2633 | d_move(old_dentry, new_dentry); | 2615 | d_move(old_dentry, new_dentry); |
2634 | } | 2616 | } |
@@ -2662,20 +2644,15 @@ int vfs_rename(struct inode *old_dir, struct dentry *old_dentry, | |||
2662 | if (!old_dir->i_op->rename) | 2644 | if (!old_dir->i_op->rename) |
2663 | return -EPERM; | 2645 | return -EPERM; |
2664 | 2646 | ||
2665 | vfs_dq_init(old_dir); | ||
2666 | vfs_dq_init(new_dir); | ||
2667 | |||
2668 | old_name = fsnotify_oldname_init(old_dentry->d_name.name); | 2647 | old_name = fsnotify_oldname_init(old_dentry->d_name.name); |
2669 | 2648 | ||
2670 | if (is_dir) | 2649 | if (is_dir) |
2671 | error = vfs_rename_dir(old_dir,old_dentry,new_dir,new_dentry); | 2650 | error = vfs_rename_dir(old_dir,old_dentry,new_dir,new_dentry); |
2672 | else | 2651 | else |
2673 | error = vfs_rename_other(old_dir,old_dentry,new_dir,new_dentry); | 2652 | error = vfs_rename_other(old_dir,old_dentry,new_dir,new_dentry); |
2674 | if (!error) { | 2653 | if (!error) |
2675 | const char *new_name = old_dentry->d_name.name; | 2654 | fsnotify_move(old_dir, new_dir, old_name, is_dir, |
2676 | fsnotify_move(old_dir, new_dir, old_name, new_name, is_dir, | ||
2677 | new_dentry->d_inode, old_dentry); | 2655 | new_dentry->d_inode, old_dentry); |
2678 | } | ||
2679 | fsnotify_oldname_free(old_name); | 2656 | fsnotify_oldname_free(old_name); |
2680 | 2657 | ||
2681 | return error; | 2658 | return error; |