diff options
Diffstat (limited to 'drivers/net/ethernet/mellanox/mlxsw/spectrum_router.c')
| -rw-r--r-- | drivers/net/ethernet/mellanox/mlxsw/spectrum_router.c | 1006 |
1 files changed, 1003 insertions, 3 deletions
diff --git a/drivers/net/ethernet/mellanox/mlxsw/spectrum_router.c b/drivers/net/ethernet/mellanox/mlxsw/spectrum_router.c index 7e3992a681b3..e084ea5448ac 100644 --- a/drivers/net/ethernet/mellanox/mlxsw/spectrum_router.c +++ b/drivers/net/ethernet/mellanox/mlxsw/spectrum_router.c | |||
| @@ -3,6 +3,7 @@ | |||
| 3 | * Copyright (c) 2016 Mellanox Technologies. All rights reserved. | 3 | * Copyright (c) 2016 Mellanox Technologies. All rights reserved. |
| 4 | * Copyright (c) 2016 Jiri Pirko <jiri@mellanox.com> | 4 | * Copyright (c) 2016 Jiri Pirko <jiri@mellanox.com> |
| 5 | * Copyright (c) 2016 Ido Schimmel <idosch@mellanox.com> | 5 | * Copyright (c) 2016 Ido Schimmel <idosch@mellanox.com> |
| 6 | * Copyright (c) 2016 Yotam Gigi <yotamg@mellanox.com> | ||
| 6 | * | 7 | * |
| 7 | * Redistribution and use in source and binary forms, with or without | 8 | * Redistribution and use in source and binary forms, with or without |
| 8 | * modification, are permitted provided that the following conditions are met: | 9 | * modification, are permitted provided that the following conditions are met: |
| @@ -38,6 +39,10 @@ | |||
| 38 | #include <linux/rhashtable.h> | 39 | #include <linux/rhashtable.h> |
| 39 | #include <linux/bitops.h> | 40 | #include <linux/bitops.h> |
| 40 | #include <linux/in6.h> | 41 | #include <linux/in6.h> |
| 42 | #include <linux/notifier.h> | ||
| 43 | #include <net/netevent.h> | ||
| 44 | #include <net/neighbour.h> | ||
| 45 | #include <net/arp.h> | ||
| 41 | 46 | ||
| 42 | #include "spectrum.h" | 47 | #include "spectrum.h" |
| 43 | #include "core.h" | 48 | #include "core.h" |
| @@ -112,6 +117,8 @@ enum mlxsw_sp_fib_entry_type { | |||
| 112 | MLXSW_SP_FIB_ENTRY_TYPE_TRAP, | 117 | MLXSW_SP_FIB_ENTRY_TYPE_TRAP, |
| 113 | }; | 118 | }; |
| 114 | 119 | ||
| 120 | struct mlxsw_sp_nexthop_group; | ||
| 121 | |||
| 115 | struct mlxsw_sp_fib_entry { | 122 | struct mlxsw_sp_fib_entry { |
| 116 | struct rhash_head ht_node; | 123 | struct rhash_head ht_node; |
| 117 | struct mlxsw_sp_fib_key key; | 124 | struct mlxsw_sp_fib_key key; |
| @@ -119,6 +126,8 @@ struct mlxsw_sp_fib_entry { | |||
| 119 | u8 added:1; | 126 | u8 added:1; |
| 120 | u16 rif; /* used for action local */ | 127 | u16 rif; /* used for action local */ |
| 121 | struct mlxsw_sp_vr *vr; | 128 | struct mlxsw_sp_vr *vr; |
| 129 | struct list_head nexthop_group_node; | ||
| 130 | struct mlxsw_sp_nexthop_group *nh_group; | ||
| 122 | }; | 131 | }; |
| 123 | 132 | ||
| 124 | struct mlxsw_sp_fib { | 133 | struct mlxsw_sp_fib { |
| @@ -544,6 +553,949 @@ static void mlxsw_sp_vrs_init(struct mlxsw_sp *mlxsw_sp) | |||
| 544 | } | 553 | } |
| 545 | } | 554 | } |
| 546 | 555 | ||
| 556 | struct mlxsw_sp_neigh_key { | ||
| 557 | unsigned char addr[sizeof(struct in6_addr)]; | ||
| 558 | struct net_device *dev; | ||
| 559 | }; | ||
| 560 | |||
| 561 | struct mlxsw_sp_neigh_entry { | ||
| 562 | struct rhash_head ht_node; | ||
| 563 | struct mlxsw_sp_neigh_key key; | ||
| 564 | u16 rif; | ||
| 565 | struct neighbour *n; | ||
| 566 | bool offloaded; | ||
| 567 | struct delayed_work dw; | ||
| 568 | struct mlxsw_sp_port *mlxsw_sp_port; | ||
| 569 | unsigned char ha[ETH_ALEN]; | ||
| 570 | struct list_head nexthop_list; /* list of nexthops using | ||
| 571 | * this neigh entry | ||
| 572 | */ | ||
| 573 | struct list_head nexthop_neighs_list_node; | ||
| 574 | }; | ||
| 575 | |||
| 576 | static const struct rhashtable_params mlxsw_sp_neigh_ht_params = { | ||
| 577 | .key_offset = offsetof(struct mlxsw_sp_neigh_entry, key), | ||
| 578 | .head_offset = offsetof(struct mlxsw_sp_neigh_entry, ht_node), | ||
| 579 | .key_len = sizeof(struct mlxsw_sp_neigh_key), | ||
| 580 | }; | ||
| 581 | |||
| 582 | static int | ||
| 583 | mlxsw_sp_neigh_entry_insert(struct mlxsw_sp *mlxsw_sp, | ||
| 584 | struct mlxsw_sp_neigh_entry *neigh_entry) | ||
| 585 | { | ||
| 586 | return rhashtable_insert_fast(&mlxsw_sp->router.neigh_ht, | ||
| 587 | &neigh_entry->ht_node, | ||
| 588 | mlxsw_sp_neigh_ht_params); | ||
| 589 | } | ||
| 590 | |||
| 591 | static void | ||
| 592 | mlxsw_sp_neigh_entry_remove(struct mlxsw_sp *mlxsw_sp, | ||
| 593 | struct mlxsw_sp_neigh_entry *neigh_entry) | ||
| 594 | { | ||
| 595 | rhashtable_remove_fast(&mlxsw_sp->router.neigh_ht, | ||
| 596 | &neigh_entry->ht_node, | ||
| 597 | mlxsw_sp_neigh_ht_params); | ||
| 598 | } | ||
| 599 | |||
| 600 | static void mlxsw_sp_router_neigh_update_hw(struct work_struct *work); | ||
| 601 | |||
| 602 | static struct mlxsw_sp_neigh_entry * | ||
| 603 | mlxsw_sp_neigh_entry_create(const void *addr, size_t addr_len, | ||
| 604 | struct net_device *dev, u16 rif, | ||
| 605 | struct neighbour *n) | ||
| 606 | { | ||
| 607 | struct mlxsw_sp_neigh_entry *neigh_entry; | ||
| 608 | |||
| 609 | neigh_entry = kzalloc(sizeof(*neigh_entry), GFP_ATOMIC); | ||
| 610 | if (!neigh_entry) | ||
| 611 | return NULL; | ||
| 612 | memcpy(neigh_entry->key.addr, addr, addr_len); | ||
| 613 | neigh_entry->key.dev = dev; | ||
| 614 | neigh_entry->rif = rif; | ||
| 615 | neigh_entry->n = n; | ||
| 616 | INIT_DELAYED_WORK(&neigh_entry->dw, mlxsw_sp_router_neigh_update_hw); | ||
| 617 | INIT_LIST_HEAD(&neigh_entry->nexthop_list); | ||
| 618 | return neigh_entry; | ||
| 619 | } | ||
| 620 | |||
| 621 | static void | ||
| 622 | mlxsw_sp_neigh_entry_destroy(struct mlxsw_sp_neigh_entry *neigh_entry) | ||
| 623 | { | ||
| 624 | kfree(neigh_entry); | ||
| 625 | } | ||
| 626 | |||
| 627 | static struct mlxsw_sp_neigh_entry * | ||
| 628 | mlxsw_sp_neigh_entry_lookup(struct mlxsw_sp *mlxsw_sp, const void *addr, | ||
| 629 | size_t addr_len, struct net_device *dev) | ||
| 630 | { | ||
| 631 | struct mlxsw_sp_neigh_key key = {{ 0 } }; | ||
| 632 | |||
| 633 | memcpy(key.addr, addr, addr_len); | ||
| 634 | key.dev = dev; | ||
| 635 | return rhashtable_lookup_fast(&mlxsw_sp->router.neigh_ht, | ||
| 636 | &key, mlxsw_sp_neigh_ht_params); | ||
| 637 | } | ||
| 638 | |||
| 639 | int mlxsw_sp_router_neigh_construct(struct net_device *dev, | ||
| 640 | struct neighbour *n) | ||
| 641 | { | ||
| 642 | struct mlxsw_sp_port *mlxsw_sp_port = netdev_priv(dev); | ||
| 643 | struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp; | ||
| 644 | struct mlxsw_sp_neigh_entry *neigh_entry; | ||
| 645 | struct mlxsw_sp_rif *r; | ||
| 646 | u32 dip; | ||
| 647 | int err; | ||
| 648 | |||
| 649 | if (n->tbl != &arp_tbl) | ||
| 650 | return 0; | ||
| 651 | |||
| 652 | dip = ntohl(*((__be32 *) n->primary_key)); | ||
| 653 | neigh_entry = mlxsw_sp_neigh_entry_lookup(mlxsw_sp, &dip, sizeof(dip), | ||
| 654 | n->dev); | ||
| 655 | if (neigh_entry) { | ||
| 656 | WARN_ON(neigh_entry->n != n); | ||
| 657 | return 0; | ||
| 658 | } | ||
| 659 | |||
| 660 | r = mlxsw_sp_rif_find_by_dev(mlxsw_sp, dev); | ||
| 661 | if (WARN_ON(!r)) | ||
| 662 | return -EINVAL; | ||
| 663 | |||
| 664 | neigh_entry = mlxsw_sp_neigh_entry_create(&dip, sizeof(dip), n->dev, | ||
| 665 | r->rif, n); | ||
| 666 | if (!neigh_entry) | ||
| 667 | return -ENOMEM; | ||
| 668 | err = mlxsw_sp_neigh_entry_insert(mlxsw_sp, neigh_entry); | ||
| 669 | if (err) | ||
| 670 | goto err_neigh_entry_insert; | ||
| 671 | return 0; | ||
| 672 | |||
| 673 | err_neigh_entry_insert: | ||
| 674 | mlxsw_sp_neigh_entry_destroy(neigh_entry); | ||
| 675 | return err; | ||
| 676 | } | ||
| 677 | |||
| 678 | void mlxsw_sp_router_neigh_destroy(struct net_device *dev, | ||
| 679 | struct neighbour *n) | ||
| 680 | { | ||
| 681 | struct mlxsw_sp_port *mlxsw_sp_port = netdev_priv(dev); | ||
| 682 | struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp; | ||
| 683 | struct mlxsw_sp_neigh_entry *neigh_entry; | ||
| 684 | u32 dip; | ||
| 685 | |||
| 686 | if (n->tbl != &arp_tbl) | ||
| 687 | return; | ||
| 688 | |||
| 689 | dip = ntohl(*((__be32 *) n->primary_key)); | ||
| 690 | neigh_entry = mlxsw_sp_neigh_entry_lookup(mlxsw_sp, &dip, sizeof(dip), | ||
| 691 | n->dev); | ||
| 692 | if (!neigh_entry) | ||
| 693 | return; | ||
| 694 | mlxsw_sp_neigh_entry_remove(mlxsw_sp, neigh_entry); | ||
| 695 | mlxsw_sp_neigh_entry_destroy(neigh_entry); | ||
| 696 | } | ||
| 697 | |||
| 698 | static void | ||
| 699 | mlxsw_sp_router_neighs_update_interval_init(struct mlxsw_sp *mlxsw_sp) | ||
| 700 | { | ||
| 701 | unsigned long interval = NEIGH_VAR(&arp_tbl.parms, DELAY_PROBE_TIME); | ||
| 702 | |||
| 703 | mlxsw_sp->router.neighs_update.interval = jiffies_to_msecs(interval); | ||
| 704 | } | ||
| 705 | |||
| 706 | static void mlxsw_sp_router_neigh_ent_ipv4_process(struct mlxsw_sp *mlxsw_sp, | ||
| 707 | char *rauhtd_pl, | ||
| 708 | int ent_index) | ||
| 709 | { | ||
| 710 | struct net_device *dev; | ||
| 711 | struct neighbour *n; | ||
| 712 | __be32 dipn; | ||
| 713 | u32 dip; | ||
| 714 | u16 rif; | ||
| 715 | |||
| 716 | mlxsw_reg_rauhtd_ent_ipv4_unpack(rauhtd_pl, ent_index, &rif, &dip); | ||
| 717 | |||
| 718 | if (!mlxsw_sp->rifs[rif]) { | ||
| 719 | dev_err_ratelimited(mlxsw_sp->bus_info->dev, "Incorrect RIF in neighbour entry\n"); | ||
| 720 | return; | ||
| 721 | } | ||
| 722 | |||
| 723 | dipn = htonl(dip); | ||
| 724 | dev = mlxsw_sp->rifs[rif]->dev; | ||
| 725 | n = neigh_lookup(&arp_tbl, &dipn, dev); | ||
| 726 | if (!n) { | ||
| 727 | netdev_err(dev, "Failed to find matching neighbour for IP=%pI4h\n", | ||
| 728 | &dip); | ||
| 729 | return; | ||
| 730 | } | ||
| 731 | |||
| 732 | netdev_dbg(dev, "Updating neighbour with IP=%pI4h\n", &dip); | ||
| 733 | neigh_event_send(n, NULL); | ||
| 734 | neigh_release(n); | ||
| 735 | } | ||
| 736 | |||
| 737 | static void mlxsw_sp_router_neigh_rec_ipv4_process(struct mlxsw_sp *mlxsw_sp, | ||
| 738 | char *rauhtd_pl, | ||
| 739 | int rec_index) | ||
| 740 | { | ||
| 741 | u8 num_entries; | ||
| 742 | int i; | ||
| 743 | |||
| 744 | num_entries = mlxsw_reg_rauhtd_ipv4_rec_num_entries_get(rauhtd_pl, | ||
| 745 | rec_index); | ||
| 746 | /* Hardware starts counting at 0, so add 1. */ | ||
| 747 | num_entries++; | ||
| 748 | |||
| 749 | /* Each record consists of several neighbour entries. */ | ||
| 750 | for (i = 0; i < num_entries; i++) { | ||
| 751 | int ent_index; | ||
| 752 | |||
| 753 | ent_index = rec_index * MLXSW_REG_RAUHTD_IPV4_ENT_PER_REC + i; | ||
| 754 | mlxsw_sp_router_neigh_ent_ipv4_process(mlxsw_sp, rauhtd_pl, | ||
| 755 | ent_index); | ||
| 756 | } | ||
| 757 | |||
| 758 | } | ||
| 759 | |||
| 760 | static void mlxsw_sp_router_neigh_rec_process(struct mlxsw_sp *mlxsw_sp, | ||
| 761 | char *rauhtd_pl, int rec_index) | ||
| 762 | { | ||
| 763 | switch (mlxsw_reg_rauhtd_rec_type_get(rauhtd_pl, rec_index)) { | ||
| 764 | case MLXSW_REG_RAUHTD_TYPE_IPV4: | ||
| 765 | mlxsw_sp_router_neigh_rec_ipv4_process(mlxsw_sp, rauhtd_pl, | ||
| 766 | rec_index); | ||
| 767 | break; | ||
| 768 | case MLXSW_REG_RAUHTD_TYPE_IPV6: | ||
| 769 | WARN_ON_ONCE(1); | ||
| 770 | break; | ||
| 771 | } | ||
| 772 | } | ||
| 773 | |||
| 774 | static int mlxsw_sp_router_neighs_update_rauhtd(struct mlxsw_sp *mlxsw_sp) | ||
| 775 | { | ||
| 776 | char *rauhtd_pl; | ||
| 777 | u8 num_rec; | ||
| 778 | int i, err; | ||
| 779 | |||
| 780 | rauhtd_pl = kmalloc(MLXSW_REG_RAUHTD_LEN, GFP_KERNEL); | ||
| 781 | if (!rauhtd_pl) | ||
| 782 | return -ENOMEM; | ||
| 783 | |||
| 784 | /* Make sure the neighbour's netdev isn't removed in the | ||
| 785 | * process. | ||
| 786 | */ | ||
| 787 | rtnl_lock(); | ||
| 788 | do { | ||
| 789 | mlxsw_reg_rauhtd_pack(rauhtd_pl, MLXSW_REG_RAUHTD_TYPE_IPV4); | ||
| 790 | err = mlxsw_reg_query(mlxsw_sp->core, MLXSW_REG(rauhtd), | ||
| 791 | rauhtd_pl); | ||
| 792 | if (err) { | ||
| 793 | dev_err_ratelimited(mlxsw_sp->bus_info->dev, "Failed to dump neighbour talbe\n"); | ||
| 794 | break; | ||
| 795 | } | ||
| 796 | num_rec = mlxsw_reg_rauhtd_num_rec_get(rauhtd_pl); | ||
| 797 | for (i = 0; i < num_rec; i++) | ||
| 798 | mlxsw_sp_router_neigh_rec_process(mlxsw_sp, rauhtd_pl, | ||
| 799 | i); | ||
| 800 | } while (num_rec); | ||
| 801 | rtnl_unlock(); | ||
| 802 | |||
| 803 | kfree(rauhtd_pl); | ||
| 804 | return err; | ||
| 805 | } | ||
| 806 | |||
| 807 | static void mlxsw_sp_router_neighs_update_nh(struct mlxsw_sp *mlxsw_sp) | ||
| 808 | { | ||
| 809 | struct mlxsw_sp_neigh_entry *neigh_entry; | ||
| 810 | |||
| 811 | /* Take RTNL mutex here to prevent lists from changes */ | ||
| 812 | rtnl_lock(); | ||
| 813 | list_for_each_entry(neigh_entry, &mlxsw_sp->router.nexthop_neighs_list, | ||
| 814 | nexthop_neighs_list_node) { | ||
| 815 | /* If this neigh have nexthops, make the kernel think this neigh | ||
| 816 | * is active regardless of the traffic. | ||
| 817 | */ | ||
| 818 | if (!list_empty(&neigh_entry->nexthop_list)) | ||
| 819 | neigh_event_send(neigh_entry->n, NULL); | ||
| 820 | } | ||
| 821 | rtnl_unlock(); | ||
| 822 | } | ||
| 823 | |||
| 824 | static void | ||
| 825 | mlxsw_sp_router_neighs_update_work_schedule(struct mlxsw_sp *mlxsw_sp) | ||
| 826 | { | ||
| 827 | unsigned long interval = mlxsw_sp->router.neighs_update.interval; | ||
| 828 | |||
| 829 | mlxsw_core_schedule_dw(&mlxsw_sp->router.neighs_update.dw, | ||
| 830 | msecs_to_jiffies(interval)); | ||
| 831 | } | ||
| 832 | |||
| 833 | static void mlxsw_sp_router_neighs_update_work(struct work_struct *work) | ||
| 834 | { | ||
| 835 | struct mlxsw_sp *mlxsw_sp = container_of(work, struct mlxsw_sp, | ||
| 836 | router.neighs_update.dw.work); | ||
| 837 | int err; | ||
| 838 | |||
| 839 | err = mlxsw_sp_router_neighs_update_rauhtd(mlxsw_sp); | ||
| 840 | if (err) | ||
| 841 | dev_err(mlxsw_sp->bus_info->dev, "Could not update kernel for neigh activity"); | ||
| 842 | |||
| 843 | mlxsw_sp_router_neighs_update_nh(mlxsw_sp); | ||
| 844 | |||
| 845 | mlxsw_sp_router_neighs_update_work_schedule(mlxsw_sp); | ||
| 846 | } | ||
| 847 | |||
| 848 | static void mlxsw_sp_router_probe_unresolved_nexthops(struct work_struct *work) | ||
| 849 | { | ||
| 850 | struct mlxsw_sp_neigh_entry *neigh_entry; | ||
| 851 | struct mlxsw_sp *mlxsw_sp = container_of(work, struct mlxsw_sp, | ||
| 852 | router.nexthop_probe_dw.work); | ||
| 853 | |||
| 854 | /* Iterate over nexthop neighbours, find those who are unresolved and | ||
| 855 | * send arp on them. This solves the chicken-egg problem when | ||
| 856 | * the nexthop wouldn't get offloaded until the neighbor is resolved | ||
| 857 | * but it wouldn't get resolved ever in case traffic is flowing in HW | ||
| 858 | * using different nexthop. | ||
| 859 | * | ||
| 860 | * Take RTNL mutex here to prevent lists from changes. | ||
| 861 | */ | ||
| 862 | rtnl_lock(); | ||
| 863 | list_for_each_entry(neigh_entry, &mlxsw_sp->router.nexthop_neighs_list, | ||
| 864 | nexthop_neighs_list_node) { | ||
| 865 | if (!(neigh_entry->n->nud_state & NUD_VALID) && | ||
| 866 | !list_empty(&neigh_entry->nexthop_list)) | ||
| 867 | neigh_event_send(neigh_entry->n, NULL); | ||
| 868 | } | ||
| 869 | rtnl_unlock(); | ||
| 870 | |||
| 871 | mlxsw_core_schedule_dw(&mlxsw_sp->router.nexthop_probe_dw, | ||
| 872 | MLXSW_SP_UNRESOLVED_NH_PROBE_INTERVAL); | ||
| 873 | } | ||
| 874 | |||
| 875 | static void | ||
| 876 | mlxsw_sp_nexthop_neigh_update(struct mlxsw_sp *mlxsw_sp, | ||
| 877 | struct mlxsw_sp_neigh_entry *neigh_entry, | ||
| 878 | bool removing); | ||
| 879 | |||
| 880 | static void mlxsw_sp_router_neigh_update_hw(struct work_struct *work) | ||
| 881 | { | ||
| 882 | struct mlxsw_sp_neigh_entry *neigh_entry = | ||
| 883 | container_of(work, struct mlxsw_sp_neigh_entry, dw.work); | ||
| 884 | struct neighbour *n = neigh_entry->n; | ||
| 885 | struct mlxsw_sp_port *mlxsw_sp_port = neigh_entry->mlxsw_sp_port; | ||
| 886 | struct mlxsw_sp *mlxsw_sp = mlxsw_sp_port->mlxsw_sp; | ||
| 887 | char rauht_pl[MLXSW_REG_RAUHT_LEN]; | ||
| 888 | struct net_device *dev; | ||
| 889 | bool entry_connected; | ||
| 890 | u8 nud_state; | ||
| 891 | bool updating; | ||
| 892 | bool removing; | ||
| 893 | bool adding; | ||
| 894 | u32 dip; | ||
| 895 | int err; | ||
| 896 | |||
| 897 | read_lock_bh(&n->lock); | ||
| 898 | dip = ntohl(*((__be32 *) n->primary_key)); | ||
| 899 | memcpy(neigh_entry->ha, n->ha, sizeof(neigh_entry->ha)); | ||
| 900 | nud_state = n->nud_state; | ||
| 901 | dev = n->dev; | ||
| 902 | read_unlock_bh(&n->lock); | ||
| 903 | |||
| 904 | entry_connected = nud_state & NUD_VALID; | ||
| 905 | adding = (!neigh_entry->offloaded) && entry_connected; | ||
| 906 | updating = neigh_entry->offloaded && entry_connected; | ||
| 907 | removing = neigh_entry->offloaded && !entry_connected; | ||
| 908 | |||
| 909 | if (adding || updating) { | ||
| 910 | mlxsw_reg_rauht_pack4(rauht_pl, MLXSW_REG_RAUHT_OP_WRITE_ADD, | ||
| 911 | neigh_entry->rif, | ||
| 912 | neigh_entry->ha, dip); | ||
| 913 | err = mlxsw_reg_write(mlxsw_sp->core, | ||
| 914 | MLXSW_REG(rauht), rauht_pl); | ||
| 915 | if (err) { | ||
| 916 | netdev_err(dev, "Could not add neigh %pI4h\n", &dip); | ||
| 917 | neigh_entry->offloaded = false; | ||
| 918 | } else { | ||
| 919 | neigh_entry->offloaded = true; | ||
| 920 | } | ||
| 921 | mlxsw_sp_nexthop_neigh_update(mlxsw_sp, neigh_entry, false); | ||
| 922 | } else if (removing) { | ||
| 923 | mlxsw_reg_rauht_pack4(rauht_pl, MLXSW_REG_RAUHT_OP_WRITE_DELETE, | ||
| 924 | neigh_entry->rif, | ||
| 925 | neigh_entry->ha, dip); | ||
| 926 | err = mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(rauht), | ||
| 927 | rauht_pl); | ||
| 928 | if (err) { | ||
| 929 | netdev_err(dev, "Could not delete neigh %pI4h\n", &dip); | ||
| 930 | neigh_entry->offloaded = true; | ||
| 931 | } else { | ||
| 932 | neigh_entry->offloaded = false; | ||
| 933 | } | ||
| 934 | mlxsw_sp_nexthop_neigh_update(mlxsw_sp, neigh_entry, true); | ||
| 935 | } | ||
| 936 | |||
| 937 | neigh_release(n); | ||
| 938 | mlxsw_sp_port_dev_put(mlxsw_sp_port); | ||
| 939 | } | ||
| 940 | |||
| 941 | static int mlxsw_sp_router_netevent_event(struct notifier_block *unused, | ||
| 942 | unsigned long event, void *ptr) | ||
| 943 | { | ||
| 944 | struct mlxsw_sp_neigh_entry *neigh_entry; | ||
| 945 | struct mlxsw_sp_port *mlxsw_sp_port; | ||
| 946 | struct mlxsw_sp *mlxsw_sp; | ||
| 947 | unsigned long interval; | ||
| 948 | struct net_device *dev; | ||
| 949 | struct neigh_parms *p; | ||
| 950 | struct neighbour *n; | ||
| 951 | u32 dip; | ||
| 952 | |||
| 953 | switch (event) { | ||
| 954 | case NETEVENT_DELAY_PROBE_TIME_UPDATE: | ||
| 955 | p = ptr; | ||
| 956 | |||
| 957 | /* We don't care about changes in the default table. */ | ||
| 958 | if (!p->dev || p->tbl != &arp_tbl) | ||
| 959 | return NOTIFY_DONE; | ||
| 960 | |||
| 961 | /* We are in atomic context and can't take RTNL mutex, | ||
| 962 | * so use RCU variant to walk the device chain. | ||
| 963 | */ | ||
| 964 | mlxsw_sp_port = mlxsw_sp_port_lower_dev_hold(p->dev); | ||
| 965 | if (!mlxsw_sp_port) | ||
| 966 | return NOTIFY_DONE; | ||
| 967 | |||
| 968 | mlxsw_sp = mlxsw_sp_port->mlxsw_sp; | ||
| 969 | interval = jiffies_to_msecs(NEIGH_VAR(p, DELAY_PROBE_TIME)); | ||
| 970 | mlxsw_sp->router.neighs_update.interval = interval; | ||
| 971 | |||
| 972 | mlxsw_sp_port_dev_put(mlxsw_sp_port); | ||
| 973 | break; | ||
| 974 | case NETEVENT_NEIGH_UPDATE: | ||
| 975 | n = ptr; | ||
| 976 | dev = n->dev; | ||
| 977 | |||
| 978 | if (n->tbl != &arp_tbl) | ||
| 979 | return NOTIFY_DONE; | ||
| 980 | |||
| 981 | mlxsw_sp_port = mlxsw_sp_port_lower_dev_hold(dev); | ||
| 982 | if (!mlxsw_sp_port) | ||
| 983 | return NOTIFY_DONE; | ||
| 984 | |||
| 985 | mlxsw_sp = mlxsw_sp_port->mlxsw_sp; | ||
| 986 | dip = ntohl(*((__be32 *) n->primary_key)); | ||
| 987 | neigh_entry = mlxsw_sp_neigh_entry_lookup(mlxsw_sp, | ||
| 988 | &dip, | ||
| 989 | sizeof(__be32), | ||
| 990 | dev); | ||
| 991 | if (WARN_ON(!neigh_entry) || WARN_ON(neigh_entry->n != n)) { | ||
| 992 | mlxsw_sp_port_dev_put(mlxsw_sp_port); | ||
| 993 | return NOTIFY_DONE; | ||
| 994 | } | ||
| 995 | neigh_entry->mlxsw_sp_port = mlxsw_sp_port; | ||
| 996 | |||
| 997 | /* Take a reference to ensure the neighbour won't be | ||
| 998 | * destructed until we drop the reference in delayed | ||
| 999 | * work. | ||
| 1000 | */ | ||
| 1001 | neigh_clone(n); | ||
| 1002 | if (!mlxsw_core_schedule_dw(&neigh_entry->dw, 0)) { | ||
| 1003 | neigh_release(n); | ||
| 1004 | mlxsw_sp_port_dev_put(mlxsw_sp_port); | ||
| 1005 | } | ||
| 1006 | break; | ||
| 1007 | } | ||
| 1008 | |||
| 1009 | return NOTIFY_DONE; | ||
| 1010 | } | ||
| 1011 | |||
| 1012 | static struct notifier_block mlxsw_sp_router_netevent_nb __read_mostly = { | ||
| 1013 | .notifier_call = mlxsw_sp_router_netevent_event, | ||
| 1014 | }; | ||
| 1015 | |||
| 1016 | static int mlxsw_sp_neigh_init(struct mlxsw_sp *mlxsw_sp) | ||
| 1017 | { | ||
| 1018 | int err; | ||
| 1019 | |||
| 1020 | err = rhashtable_init(&mlxsw_sp->router.neigh_ht, | ||
| 1021 | &mlxsw_sp_neigh_ht_params); | ||
| 1022 | if (err) | ||
| 1023 | return err; | ||
| 1024 | |||
| 1025 | /* Initialize the polling interval according to the default | ||
| 1026 | * table. | ||
| 1027 | */ | ||
| 1028 | mlxsw_sp_router_neighs_update_interval_init(mlxsw_sp); | ||
| 1029 | |||
| 1030 | err = register_netevent_notifier(&mlxsw_sp_router_netevent_nb); | ||
| 1031 | if (err) | ||
| 1032 | goto err_register_netevent_notifier; | ||
| 1033 | |||
| 1034 | /* Create the delayed works for the activity_update */ | ||
| 1035 | INIT_DELAYED_WORK(&mlxsw_sp->router.neighs_update.dw, | ||
| 1036 | mlxsw_sp_router_neighs_update_work); | ||
| 1037 | INIT_DELAYED_WORK(&mlxsw_sp->router.nexthop_probe_dw, | ||
| 1038 | mlxsw_sp_router_probe_unresolved_nexthops); | ||
| 1039 | mlxsw_core_schedule_dw(&mlxsw_sp->router.neighs_update.dw, 0); | ||
| 1040 | mlxsw_core_schedule_dw(&mlxsw_sp->router.nexthop_probe_dw, 0); | ||
| 1041 | return 0; | ||
| 1042 | |||
| 1043 | err_register_netevent_notifier: | ||
| 1044 | rhashtable_destroy(&mlxsw_sp->router.neigh_ht); | ||
| 1045 | return err; | ||
| 1046 | } | ||
| 1047 | |||
| 1048 | static void mlxsw_sp_neigh_fini(struct mlxsw_sp *mlxsw_sp) | ||
| 1049 | { | ||
| 1050 | cancel_delayed_work_sync(&mlxsw_sp->router.neighs_update.dw); | ||
| 1051 | cancel_delayed_work_sync(&mlxsw_sp->router.nexthop_probe_dw); | ||
| 1052 | unregister_netevent_notifier(&mlxsw_sp_router_netevent_nb); | ||
| 1053 | rhashtable_destroy(&mlxsw_sp->router.neigh_ht); | ||
| 1054 | } | ||
| 1055 | |||
| 1056 | struct mlxsw_sp_nexthop { | ||
| 1057 | struct list_head neigh_list_node; /* member of neigh entry list */ | ||
| 1058 | struct mlxsw_sp_nexthop_group *nh_grp; /* pointer back to the group | ||
| 1059 | * this belongs to | ||
| 1060 | */ | ||
| 1061 | u8 should_offload:1, /* set indicates this neigh is connected and | ||
| 1062 | * should be put to KVD linear area of this group. | ||
| 1063 | */ | ||
| 1064 | offloaded:1, /* set in case the neigh is actually put into | ||
| 1065 | * KVD linear area of this group. | ||
| 1066 | */ | ||
| 1067 | update:1; /* set indicates that MAC of this neigh should be | ||
| 1068 | * updated in HW | ||
| 1069 | */ | ||
| 1070 | struct mlxsw_sp_neigh_entry *neigh_entry; | ||
| 1071 | }; | ||
| 1072 | |||
| 1073 | struct mlxsw_sp_nexthop_group { | ||
| 1074 | struct list_head list; /* node in mlxsw->router.nexthop_group_list */ | ||
| 1075 | struct list_head fib_list; /* list of fib entries that use this group */ | ||
| 1076 | u8 adj_index_valid:1; | ||
| 1077 | u32 adj_index; | ||
| 1078 | u16 ecmp_size; | ||
| 1079 | u16 count; | ||
| 1080 | struct mlxsw_sp_nexthop nexthops[0]; | ||
| 1081 | }; | ||
| 1082 | |||
| 1083 | static int mlxsw_sp_adj_index_mass_update_vr(struct mlxsw_sp *mlxsw_sp, | ||
| 1084 | struct mlxsw_sp_vr *vr, | ||
| 1085 | u32 adj_index, u16 ecmp_size, | ||
| 1086 | u32 new_adj_index, | ||
| 1087 | u16 new_ecmp_size) | ||
| 1088 | { | ||
| 1089 | char raleu_pl[MLXSW_REG_RALEU_LEN]; | ||
| 1090 | |||
| 1091 | mlxsw_reg_raleu_pack(raleu_pl, vr->proto, vr->id, | ||
| 1092 | adj_index, ecmp_size, | ||
| 1093 | new_adj_index, new_ecmp_size); | ||
| 1094 | return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(raleu), raleu_pl); | ||
| 1095 | } | ||
| 1096 | |||
| 1097 | static int mlxsw_sp_adj_index_mass_update(struct mlxsw_sp *mlxsw_sp, | ||
| 1098 | struct mlxsw_sp_nexthop_group *nh_grp, | ||
| 1099 | u32 old_adj_index, u16 old_ecmp_size) | ||
| 1100 | { | ||
| 1101 | struct mlxsw_sp_fib_entry *fib_entry; | ||
| 1102 | struct mlxsw_sp_vr *vr = NULL; | ||
| 1103 | int err; | ||
| 1104 | |||
| 1105 | list_for_each_entry(fib_entry, &nh_grp->fib_list, nexthop_group_node) { | ||
| 1106 | if (vr == fib_entry->vr) | ||
| 1107 | continue; | ||
| 1108 | vr = fib_entry->vr; | ||
| 1109 | err = mlxsw_sp_adj_index_mass_update_vr(mlxsw_sp, vr, | ||
| 1110 | old_adj_index, | ||
| 1111 | old_ecmp_size, | ||
| 1112 | nh_grp->adj_index, | ||
| 1113 | nh_grp->ecmp_size); | ||
| 1114 | if (err) | ||
| 1115 | return err; | ||
| 1116 | } | ||
| 1117 | return 0; | ||
| 1118 | } | ||
| 1119 | |||
| 1120 | static int mlxsw_sp_nexthop_mac_update(struct mlxsw_sp *mlxsw_sp, u32 adj_index, | ||
| 1121 | struct mlxsw_sp_nexthop *nh) | ||
| 1122 | { | ||
| 1123 | struct mlxsw_sp_neigh_entry *neigh_entry = nh->neigh_entry; | ||
| 1124 | char ratr_pl[MLXSW_REG_RATR_LEN]; | ||
| 1125 | |||
| 1126 | mlxsw_reg_ratr_pack(ratr_pl, MLXSW_REG_RATR_OP_WRITE_WRITE_ENTRY, | ||
| 1127 | true, adj_index, neigh_entry->rif); | ||
| 1128 | mlxsw_reg_ratr_eth_entry_pack(ratr_pl, neigh_entry->ha); | ||
| 1129 | return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ratr), ratr_pl); | ||
| 1130 | } | ||
| 1131 | |||
| 1132 | static int | ||
| 1133 | mlxsw_sp_nexthop_group_mac_update(struct mlxsw_sp *mlxsw_sp, | ||
| 1134 | struct mlxsw_sp_nexthop_group *nh_grp) | ||
| 1135 | { | ||
| 1136 | u32 adj_index = nh_grp->adj_index; /* base */ | ||
| 1137 | struct mlxsw_sp_nexthop *nh; | ||
| 1138 | int i; | ||
| 1139 | int err; | ||
| 1140 | |||
| 1141 | for (i = 0; i < nh_grp->count; i++) { | ||
| 1142 | nh = &nh_grp->nexthops[i]; | ||
| 1143 | |||
| 1144 | if (!nh->should_offload) { | ||
| 1145 | nh->offloaded = 0; | ||
| 1146 | continue; | ||
| 1147 | } | ||
| 1148 | |||
| 1149 | if (nh->update) { | ||
| 1150 | err = mlxsw_sp_nexthop_mac_update(mlxsw_sp, | ||
| 1151 | adj_index, nh); | ||
| 1152 | if (err) | ||
| 1153 | return err; | ||
| 1154 | nh->update = 0; | ||
| 1155 | nh->offloaded = 1; | ||
| 1156 | } | ||
| 1157 | adj_index++; | ||
| 1158 | } | ||
| 1159 | return 0; | ||
| 1160 | } | ||
| 1161 | |||
| 1162 | static int mlxsw_sp_fib_entry_update(struct mlxsw_sp *mlxsw_sp, | ||
| 1163 | struct mlxsw_sp_fib_entry *fib_entry); | ||
| 1164 | |||
| 1165 | static int | ||
| 1166 | mlxsw_sp_nexthop_fib_entries_update(struct mlxsw_sp *mlxsw_sp, | ||
| 1167 | struct mlxsw_sp_nexthop_group *nh_grp) | ||
| 1168 | { | ||
| 1169 | struct mlxsw_sp_fib_entry *fib_entry; | ||
| 1170 | int err; | ||
| 1171 | |||
| 1172 | list_for_each_entry(fib_entry, &nh_grp->fib_list, nexthop_group_node) { | ||
| 1173 | err = mlxsw_sp_fib_entry_update(mlxsw_sp, fib_entry); | ||
| 1174 | if (err) | ||
| 1175 | return err; | ||
| 1176 | } | ||
| 1177 | return 0; | ||
| 1178 | } | ||
| 1179 | |||
| 1180 | static void | ||
| 1181 | mlxsw_sp_nexthop_group_refresh(struct mlxsw_sp *mlxsw_sp, | ||
| 1182 | struct mlxsw_sp_nexthop_group *nh_grp) | ||
| 1183 | { | ||
| 1184 | struct mlxsw_sp_nexthop *nh; | ||
| 1185 | bool offload_change = false; | ||
| 1186 | u32 adj_index; | ||
| 1187 | u16 ecmp_size = 0; | ||
| 1188 | bool old_adj_index_valid; | ||
| 1189 | u32 old_adj_index; | ||
| 1190 | u16 old_ecmp_size; | ||
| 1191 | int ret; | ||
| 1192 | int i; | ||
| 1193 | int err; | ||
| 1194 | |||
| 1195 | for (i = 0; i < nh_grp->count; i++) { | ||
| 1196 | nh = &nh_grp->nexthops[i]; | ||
| 1197 | |||
| 1198 | if (nh->should_offload ^ nh->offloaded) { | ||
| 1199 | offload_change = true; | ||
| 1200 | if (nh->should_offload) | ||
| 1201 | nh->update = 1; | ||
| 1202 | } | ||
| 1203 | if (nh->should_offload) | ||
| 1204 | ecmp_size++; | ||
| 1205 | } | ||
| 1206 | if (!offload_change) { | ||
| 1207 | /* Nothing was added or removed, so no need to reallocate. Just | ||
| 1208 | * update MAC on existing adjacency indexes. | ||
| 1209 | */ | ||
| 1210 | err = mlxsw_sp_nexthop_group_mac_update(mlxsw_sp, nh_grp); | ||
| 1211 | if (err) { | ||
| 1212 | dev_warn(mlxsw_sp->bus_info->dev, "Failed to update neigh MAC in adjacency table.\n"); | ||
| 1213 | goto set_trap; | ||
| 1214 | } | ||
| 1215 | return; | ||
| 1216 | } | ||
| 1217 | if (!ecmp_size) | ||
| 1218 | /* No neigh of this group is connected so we just set | ||
| 1219 | * the trap and let everthing flow through kernel. | ||
| 1220 | */ | ||
| 1221 | goto set_trap; | ||
| 1222 | |||
| 1223 | ret = mlxsw_sp_kvdl_alloc(mlxsw_sp, ecmp_size); | ||
| 1224 | if (ret < 0) { | ||
| 1225 | /* We ran out of KVD linear space, just set the | ||
| 1226 | * trap and let everything flow through kernel. | ||
| 1227 | */ | ||
| 1228 | dev_warn(mlxsw_sp->bus_info->dev, "Failed to allocate KVD linear area for nexthop group.\n"); | ||
| 1229 | goto set_trap; | ||
| 1230 | } | ||
| 1231 | adj_index = ret; | ||
| 1232 | old_adj_index_valid = nh_grp->adj_index_valid; | ||
| 1233 | old_adj_index = nh_grp->adj_index; | ||
| 1234 | old_ecmp_size = nh_grp->ecmp_size; | ||
| 1235 | nh_grp->adj_index_valid = 1; | ||
| 1236 | nh_grp->adj_index = adj_index; | ||
| 1237 | nh_grp->ecmp_size = ecmp_size; | ||
| 1238 | err = mlxsw_sp_nexthop_group_mac_update(mlxsw_sp, nh_grp); | ||
| 1239 | if (err) { | ||
| 1240 | dev_warn(mlxsw_sp->bus_info->dev, "Failed to update neigh MAC in adjacency table.\n"); | ||
| 1241 | goto set_trap; | ||
| 1242 | } | ||
| 1243 | |||
| 1244 | if (!old_adj_index_valid) { | ||
| 1245 | /* The trap was set for fib entries, so we have to call | ||
| 1246 | * fib entry update to unset it and use adjacency index. | ||
| 1247 | */ | ||
| 1248 | err = mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, nh_grp); | ||
| 1249 | if (err) { | ||
| 1250 | dev_warn(mlxsw_sp->bus_info->dev, "Failed to add adjacency index to fib entries.\n"); | ||
| 1251 | goto set_trap; | ||
| 1252 | } | ||
| 1253 | return; | ||
| 1254 | } | ||
| 1255 | |||
| 1256 | err = mlxsw_sp_adj_index_mass_update(mlxsw_sp, nh_grp, | ||
| 1257 | old_adj_index, old_ecmp_size); | ||
| 1258 | mlxsw_sp_kvdl_free(mlxsw_sp, old_adj_index); | ||
| 1259 | if (err) { | ||
| 1260 | dev_warn(mlxsw_sp->bus_info->dev, "Failed to mass-update adjacency index for nexthop group.\n"); | ||
| 1261 | goto set_trap; | ||
| 1262 | } | ||
| 1263 | return; | ||
| 1264 | |||
| 1265 | set_trap: | ||
| 1266 | old_adj_index_valid = nh_grp->adj_index_valid; | ||
| 1267 | nh_grp->adj_index_valid = 0; | ||
| 1268 | for (i = 0; i < nh_grp->count; i++) { | ||
| 1269 | nh = &nh_grp->nexthops[i]; | ||
| 1270 | nh->offloaded = 0; | ||
| 1271 | } | ||
| 1272 | err = mlxsw_sp_nexthop_fib_entries_update(mlxsw_sp, nh_grp); | ||
| 1273 | if (err) | ||
| 1274 | dev_warn(mlxsw_sp->bus_info->dev, "Failed to set traps for fib entries.\n"); | ||
| 1275 | if (old_adj_index_valid) | ||
| 1276 | mlxsw_sp_kvdl_free(mlxsw_sp, nh_grp->adj_index); | ||
| 1277 | } | ||
| 1278 | |||
| 1279 | static void __mlxsw_sp_nexthop_neigh_update(struct mlxsw_sp_nexthop *nh, | ||
| 1280 | bool removing) | ||
| 1281 | { | ||
| 1282 | if (!removing && !nh->should_offload) | ||
| 1283 | nh->should_offload = 1; | ||
| 1284 | else if (removing && nh->offloaded) | ||
| 1285 | nh->should_offload = 0; | ||
| 1286 | nh->update = 1; | ||
| 1287 | } | ||
| 1288 | |||
| 1289 | static void | ||
| 1290 | mlxsw_sp_nexthop_neigh_update(struct mlxsw_sp *mlxsw_sp, | ||
| 1291 | struct mlxsw_sp_neigh_entry *neigh_entry, | ||
| 1292 | bool removing) | ||
| 1293 | { | ||
| 1294 | struct mlxsw_sp_nexthop *nh; | ||
| 1295 | |||
| 1296 | /* Take RTNL mutex here to prevent lists from changes */ | ||
| 1297 | rtnl_lock(); | ||
| 1298 | list_for_each_entry(nh, &neigh_entry->nexthop_list, | ||
| 1299 | neigh_list_node) { | ||
| 1300 | __mlxsw_sp_nexthop_neigh_update(nh, removing); | ||
| 1301 | mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh->nh_grp); | ||
| 1302 | } | ||
| 1303 | rtnl_unlock(); | ||
| 1304 | } | ||
| 1305 | |||
| 1306 | static int mlxsw_sp_nexthop_init(struct mlxsw_sp *mlxsw_sp, | ||
| 1307 | struct mlxsw_sp_nexthop_group *nh_grp, | ||
| 1308 | struct mlxsw_sp_nexthop *nh, | ||
| 1309 | struct fib_nh *fib_nh) | ||
| 1310 | { | ||
| 1311 | struct mlxsw_sp_neigh_entry *neigh_entry; | ||
| 1312 | u32 gwip = ntohl(fib_nh->nh_gw); | ||
| 1313 | struct net_device *dev = fib_nh->nh_dev; | ||
| 1314 | struct neighbour *n; | ||
| 1315 | u8 nud_state; | ||
| 1316 | |||
| 1317 | neigh_entry = mlxsw_sp_neigh_entry_lookup(mlxsw_sp, &gwip, | ||
| 1318 | sizeof(gwip), dev); | ||
| 1319 | if (!neigh_entry) { | ||
| 1320 | __be32 gwipn = htonl(gwip); | ||
| 1321 | |||
| 1322 | n = neigh_create(&arp_tbl, &gwipn, dev); | ||
| 1323 | if (IS_ERR(n)) | ||
| 1324 | return PTR_ERR(n); | ||
| 1325 | neigh_event_send(n, NULL); | ||
| 1326 | neigh_entry = mlxsw_sp_neigh_entry_lookup(mlxsw_sp, &gwip, | ||
| 1327 | sizeof(gwip), dev); | ||
| 1328 | if (!neigh_entry) { | ||
| 1329 | neigh_release(n); | ||
| 1330 | return -EINVAL; | ||
| 1331 | } | ||
| 1332 | } else { | ||
| 1333 | /* Take a reference of neigh here ensuring that neigh would | ||
| 1334 | * not be detructed before the nexthop entry is finished. | ||
| 1335 | * The second branch takes the reference in neith_create() | ||
| 1336 | */ | ||
| 1337 | n = neigh_entry->n; | ||
| 1338 | neigh_clone(n); | ||
| 1339 | } | ||
| 1340 | |||
| 1341 | /* If that is the first nexthop connected to that neigh, add to | ||
| 1342 | * nexthop_neighs_list | ||
| 1343 | */ | ||
| 1344 | if (list_empty(&neigh_entry->nexthop_list)) | ||
| 1345 | list_add_tail(&neigh_entry->nexthop_neighs_list_node, | ||
| 1346 | &mlxsw_sp->router.nexthop_neighs_list); | ||
| 1347 | |||
| 1348 | nh->nh_grp = nh_grp; | ||
| 1349 | nh->neigh_entry = neigh_entry; | ||
| 1350 | list_add_tail(&nh->neigh_list_node, &neigh_entry->nexthop_list); | ||
| 1351 | read_lock_bh(&n->lock); | ||
| 1352 | nud_state = n->nud_state; | ||
| 1353 | read_unlock_bh(&n->lock); | ||
| 1354 | __mlxsw_sp_nexthop_neigh_update(nh, !(nud_state & NUD_VALID)); | ||
| 1355 | |||
| 1356 | return 0; | ||
| 1357 | } | ||
| 1358 | |||
| 1359 | static void mlxsw_sp_nexthop_fini(struct mlxsw_sp *mlxsw_sp, | ||
| 1360 | struct mlxsw_sp_nexthop *nh) | ||
| 1361 | { | ||
| 1362 | struct mlxsw_sp_neigh_entry *neigh_entry = nh->neigh_entry; | ||
| 1363 | |||
| 1364 | list_del(&nh->neigh_list_node); | ||
| 1365 | |||
| 1366 | /* If that is the last nexthop connected to that neigh, remove from | ||
| 1367 | * nexthop_neighs_list | ||
| 1368 | */ | ||
| 1369 | if (list_empty(&nh->neigh_entry->nexthop_list)) | ||
| 1370 | list_del(&nh->neigh_entry->nexthop_neighs_list_node); | ||
| 1371 | |||
| 1372 | neigh_release(neigh_entry->n); | ||
| 1373 | } | ||
| 1374 | |||
| 1375 | static struct mlxsw_sp_nexthop_group * | ||
| 1376 | mlxsw_sp_nexthop_group_create(struct mlxsw_sp *mlxsw_sp, struct fib_info *fi) | ||
| 1377 | { | ||
| 1378 | struct mlxsw_sp_nexthop_group *nh_grp; | ||
| 1379 | struct mlxsw_sp_nexthop *nh; | ||
| 1380 | struct fib_nh *fib_nh; | ||
| 1381 | size_t alloc_size; | ||
| 1382 | int i; | ||
| 1383 | int err; | ||
| 1384 | |||
| 1385 | alloc_size = sizeof(*nh_grp) + | ||
| 1386 | fi->fib_nhs * sizeof(struct mlxsw_sp_nexthop); | ||
| 1387 | nh_grp = kzalloc(alloc_size, GFP_KERNEL); | ||
| 1388 | if (!nh_grp) | ||
| 1389 | return ERR_PTR(-ENOMEM); | ||
| 1390 | INIT_LIST_HEAD(&nh_grp->fib_list); | ||
| 1391 | nh_grp->count = fi->fib_nhs; | ||
| 1392 | for (i = 0; i < nh_grp->count; i++) { | ||
| 1393 | nh = &nh_grp->nexthops[i]; | ||
| 1394 | fib_nh = &fi->fib_nh[i]; | ||
| 1395 | err = mlxsw_sp_nexthop_init(mlxsw_sp, nh_grp, nh, fib_nh); | ||
| 1396 | if (err) | ||
| 1397 | goto err_nexthop_init; | ||
| 1398 | } | ||
| 1399 | list_add_tail(&nh_grp->list, &mlxsw_sp->router.nexthop_group_list); | ||
| 1400 | mlxsw_sp_nexthop_group_refresh(mlxsw_sp, nh_grp); | ||
| 1401 | return nh_grp; | ||
| 1402 | |||
| 1403 | err_nexthop_init: | ||
| 1404 | for (i--; i >= 0; i--) | ||
| 1405 | mlxsw_sp_nexthop_fini(mlxsw_sp, nh); | ||
| 1406 | kfree(nh_grp); | ||
| 1407 | return ERR_PTR(err); | ||
| 1408 | } | ||
| 1409 | |||
| 1410 | static void | ||
| 1411 | mlxsw_sp_nexthop_group_destroy(struct mlxsw_sp *mlxsw_sp, | ||
| 1412 | struct mlxsw_sp_nexthop_group *nh_grp) | ||
| 1413 | { | ||
| 1414 | struct mlxsw_sp_nexthop *nh; | ||
| 1415 | int i; | ||
| 1416 | |||
| 1417 | list_del(&nh_grp->list); | ||
| 1418 | for (i = 0; i < nh_grp->count; i++) { | ||
| 1419 | nh = &nh_grp->nexthops[i]; | ||
| 1420 | mlxsw_sp_nexthop_fini(mlxsw_sp, nh); | ||
| 1421 | } | ||
| 1422 | kfree(nh_grp); | ||
| 1423 | } | ||
| 1424 | |||
| 1425 | static bool mlxsw_sp_nexthop_match(struct mlxsw_sp_nexthop *nh, | ||
| 1426 | struct fib_info *fi) | ||
| 1427 | { | ||
| 1428 | int i; | ||
| 1429 | |||
| 1430 | for (i = 0; i < fi->fib_nhs; i++) { | ||
| 1431 | struct fib_nh *fib_nh = &fi->fib_nh[i]; | ||
| 1432 | u32 gwip = ntohl(fib_nh->nh_gw); | ||
| 1433 | |||
| 1434 | if (memcmp(nh->neigh_entry->key.addr, | ||
| 1435 | &gwip, sizeof(u32)) == 0 && | ||
| 1436 | nh->neigh_entry->key.dev == fib_nh->nh_dev) | ||
| 1437 | return true; | ||
| 1438 | } | ||
| 1439 | return false; | ||
| 1440 | } | ||
| 1441 | |||
| 1442 | static bool mlxsw_sp_nexthop_group_match(struct mlxsw_sp_nexthop_group *nh_grp, | ||
| 1443 | struct fib_info *fi) | ||
| 1444 | { | ||
| 1445 | int i; | ||
| 1446 | |||
| 1447 | if (nh_grp->count != fi->fib_nhs) | ||
| 1448 | return false; | ||
| 1449 | for (i = 0; i < nh_grp->count; i++) { | ||
| 1450 | struct mlxsw_sp_nexthop *nh = &nh_grp->nexthops[i]; | ||
| 1451 | |||
| 1452 | if (!mlxsw_sp_nexthop_match(nh, fi)) | ||
| 1453 | return false; | ||
| 1454 | } | ||
| 1455 | return true; | ||
| 1456 | } | ||
| 1457 | |||
| 1458 | static struct mlxsw_sp_nexthop_group * | ||
| 1459 | mlxsw_sp_nexthop_group_find(struct mlxsw_sp *mlxsw_sp, struct fib_info *fi) | ||
| 1460 | { | ||
| 1461 | struct mlxsw_sp_nexthop_group *nh_grp; | ||
| 1462 | |||
| 1463 | list_for_each_entry(nh_grp, &mlxsw_sp->router.nexthop_group_list, | ||
| 1464 | list) { | ||
| 1465 | if (mlxsw_sp_nexthop_group_match(nh_grp, fi)) | ||
| 1466 | return nh_grp; | ||
| 1467 | } | ||
| 1468 | return NULL; | ||
| 1469 | } | ||
| 1470 | |||
| 1471 | static int mlxsw_sp_nexthop_group_get(struct mlxsw_sp *mlxsw_sp, | ||
| 1472 | struct mlxsw_sp_fib_entry *fib_entry, | ||
| 1473 | struct fib_info *fi) | ||
| 1474 | { | ||
| 1475 | struct mlxsw_sp_nexthop_group *nh_grp; | ||
| 1476 | |||
| 1477 | nh_grp = mlxsw_sp_nexthop_group_find(mlxsw_sp, fi); | ||
| 1478 | if (!nh_grp) { | ||
| 1479 | nh_grp = mlxsw_sp_nexthop_group_create(mlxsw_sp, fi); | ||
| 1480 | if (IS_ERR(nh_grp)) | ||
| 1481 | return PTR_ERR(nh_grp); | ||
| 1482 | } | ||
| 1483 | list_add_tail(&fib_entry->nexthop_group_node, &nh_grp->fib_list); | ||
| 1484 | fib_entry->nh_group = nh_grp; | ||
| 1485 | return 0; | ||
| 1486 | } | ||
| 1487 | |||
| 1488 | static void mlxsw_sp_nexthop_group_put(struct mlxsw_sp *mlxsw_sp, | ||
| 1489 | struct mlxsw_sp_fib_entry *fib_entry) | ||
| 1490 | { | ||
| 1491 | struct mlxsw_sp_nexthop_group *nh_grp = fib_entry->nh_group; | ||
| 1492 | |||
| 1493 | list_del(&fib_entry->nexthop_group_node); | ||
| 1494 | if (!list_empty(&nh_grp->fib_list)) | ||
| 1495 | return; | ||
| 1496 | mlxsw_sp_nexthop_group_destroy(mlxsw_sp, nh_grp); | ||
| 1497 | } | ||
| 1498 | |||
| 547 | static int __mlxsw_sp_router_init(struct mlxsw_sp *mlxsw_sp) | 1499 | static int __mlxsw_sp_router_init(struct mlxsw_sp *mlxsw_sp) |
| 548 | { | 1500 | { |
| 549 | char rgcr_pl[MLXSW_REG_RGCR_LEN]; | 1501 | char rgcr_pl[MLXSW_REG_RGCR_LEN]; |
| @@ -565,19 +1517,54 @@ int mlxsw_sp_router_init(struct mlxsw_sp *mlxsw_sp) | |||
| 565 | { | 1517 | { |
| 566 | int err; | 1518 | int err; |
| 567 | 1519 | ||
| 1520 | INIT_LIST_HEAD(&mlxsw_sp->router.nexthop_neighs_list); | ||
| 1521 | INIT_LIST_HEAD(&mlxsw_sp->router.nexthop_group_list); | ||
| 568 | err = __mlxsw_sp_router_init(mlxsw_sp); | 1522 | err = __mlxsw_sp_router_init(mlxsw_sp); |
| 569 | if (err) | 1523 | if (err) |
| 570 | return err; | 1524 | return err; |
| 571 | mlxsw_sp_lpm_init(mlxsw_sp); | 1525 | mlxsw_sp_lpm_init(mlxsw_sp); |
| 572 | mlxsw_sp_vrs_init(mlxsw_sp); | 1526 | mlxsw_sp_vrs_init(mlxsw_sp); |
| 573 | return 0; | 1527 | return mlxsw_sp_neigh_init(mlxsw_sp); |
| 574 | } | 1528 | } |
| 575 | 1529 | ||
| 576 | void mlxsw_sp_router_fini(struct mlxsw_sp *mlxsw_sp) | 1530 | void mlxsw_sp_router_fini(struct mlxsw_sp *mlxsw_sp) |
| 577 | { | 1531 | { |
| 1532 | mlxsw_sp_neigh_fini(mlxsw_sp); | ||
| 578 | __mlxsw_sp_router_fini(mlxsw_sp); | 1533 | __mlxsw_sp_router_fini(mlxsw_sp); |
| 579 | } | 1534 | } |
| 580 | 1535 | ||
| 1536 | static int mlxsw_sp_fib_entry_op4_remote(struct mlxsw_sp *mlxsw_sp, | ||
| 1537 | struct mlxsw_sp_fib_entry *fib_entry, | ||
| 1538 | enum mlxsw_reg_ralue_op op) | ||
| 1539 | { | ||
| 1540 | char ralue_pl[MLXSW_REG_RALUE_LEN]; | ||
| 1541 | u32 *p_dip = (u32 *) fib_entry->key.addr; | ||
| 1542 | struct mlxsw_sp_vr *vr = fib_entry->vr; | ||
| 1543 | enum mlxsw_reg_ralue_trap_action trap_action; | ||
| 1544 | u16 trap_id = 0; | ||
| 1545 | u32 adjacency_index = 0; | ||
| 1546 | u16 ecmp_size = 0; | ||
| 1547 | |||
| 1548 | /* In case the nexthop group adjacency index is valid, use it | ||
| 1549 | * with provided ECMP size. Otherwise, setup trap and pass | ||
| 1550 | * traffic to kernel. | ||
| 1551 | */ | ||
| 1552 | if (fib_entry->nh_group->adj_index_valid) { | ||
| 1553 | trap_action = MLXSW_REG_RALUE_TRAP_ACTION_NOP; | ||
| 1554 | adjacency_index = fib_entry->nh_group->adj_index; | ||
| 1555 | ecmp_size = fib_entry->nh_group->ecmp_size; | ||
| 1556 | } else { | ||
| 1557 | trap_action = MLXSW_REG_RALUE_TRAP_ACTION_TRAP; | ||
| 1558 | trap_id = MLXSW_TRAP_ID_RTR_INGRESS0; | ||
| 1559 | } | ||
| 1560 | |||
| 1561 | mlxsw_reg_ralue_pack4(ralue_pl, vr->proto, op, vr->id, | ||
| 1562 | fib_entry->key.prefix_len, *p_dip); | ||
| 1563 | mlxsw_reg_ralue_act_remote_pack(ralue_pl, trap_action, trap_id, | ||
| 1564 | adjacency_index, ecmp_size); | ||
| 1565 | return mlxsw_reg_write(mlxsw_sp->core, MLXSW_REG(ralue), ralue_pl); | ||
| 1566 | } | ||
| 1567 | |||
| 581 | static int mlxsw_sp_fib_entry_op4_local(struct mlxsw_sp *mlxsw_sp, | 1568 | static int mlxsw_sp_fib_entry_op4_local(struct mlxsw_sp *mlxsw_sp, |
| 582 | struct mlxsw_sp_fib_entry *fib_entry, | 1569 | struct mlxsw_sp_fib_entry *fib_entry, |
| 583 | enum mlxsw_reg_ralue_op op) | 1570 | enum mlxsw_reg_ralue_op op) |
| @@ -614,7 +1601,7 @@ static int mlxsw_sp_fib_entry_op4(struct mlxsw_sp *mlxsw_sp, | |||
| 614 | { | 1601 | { |
| 615 | switch (fib_entry->type) { | 1602 | switch (fib_entry->type) { |
| 616 | case MLXSW_SP_FIB_ENTRY_TYPE_REMOTE: | 1603 | case MLXSW_SP_FIB_ENTRY_TYPE_REMOTE: |
| 617 | return -EINVAL; | 1604 | return mlxsw_sp_fib_entry_op4_remote(mlxsw_sp, fib_entry, op); |
| 618 | case MLXSW_SP_FIB_ENTRY_TYPE_LOCAL: | 1605 | case MLXSW_SP_FIB_ENTRY_TYPE_LOCAL: |
| 619 | return mlxsw_sp_fib_entry_op4_local(mlxsw_sp, fib_entry, op); | 1606 | return mlxsw_sp_fib_entry_op4_local(mlxsw_sp, fib_entry, op); |
| 620 | case MLXSW_SP_FIB_ENTRY_TYPE_TRAP: | 1607 | case MLXSW_SP_FIB_ENTRY_TYPE_TRAP: |
| @@ -694,7 +1681,17 @@ mlxsw_sp_router_fib4_entry_init(struct mlxsw_sp *mlxsw_sp, | |||
| 694 | fib_entry->rif = r->rif; | 1681 | fib_entry->rif = r->rif; |
| 695 | return 0; | 1682 | return 0; |
| 696 | } | 1683 | } |
| 697 | return -EINVAL; | 1684 | fib_entry->type = MLXSW_SP_FIB_ENTRY_TYPE_REMOTE; |
| 1685 | return mlxsw_sp_nexthop_group_get(mlxsw_sp, fib_entry, fi); | ||
| 1686 | } | ||
| 1687 | |||
| 1688 | static void | ||
| 1689 | mlxsw_sp_router_fib4_entry_fini(struct mlxsw_sp *mlxsw_sp, | ||
| 1690 | struct mlxsw_sp_fib_entry *fib_entry) | ||
| 1691 | { | ||
| 1692 | if (fib_entry->type != MLXSW_SP_FIB_ENTRY_TYPE_REMOTE) | ||
| 1693 | return; | ||
| 1694 | mlxsw_sp_nexthop_group_put(mlxsw_sp, fib_entry); | ||
| 698 | } | 1695 | } |
| 699 | 1696 | ||
| 700 | static int | 1697 | static int |
| @@ -738,6 +1735,7 @@ mlxsw_sp_router_fib4_add_prepare(struct mlxsw_sp_port *mlxsw_sp_port, | |||
| 738 | return 0; | 1735 | return 0; |
| 739 | 1736 | ||
| 740 | err_alloc_info: | 1737 | err_alloc_info: |
| 1738 | mlxsw_sp_router_fib4_entry_fini(mlxsw_sp, fib_entry); | ||
| 741 | err_fib4_entry_init: | 1739 | err_fib4_entry_init: |
| 742 | mlxsw_sp_fib_entry_destroy(fib_entry); | 1740 | mlxsw_sp_fib_entry_destroy(fib_entry); |
| 743 | err_fib_entry_create: | 1741 | err_fib_entry_create: |
| @@ -772,6 +1770,7 @@ mlxsw_sp_router_fib4_add_commit(struct mlxsw_sp_port *mlxsw_sp_port, | |||
| 772 | err_fib_entry_add: | 1770 | err_fib_entry_add: |
| 773 | mlxsw_sp_fib_entry_remove(vr->fib, fib_entry); | 1771 | mlxsw_sp_fib_entry_remove(vr->fib, fib_entry); |
| 774 | err_fib_entry_insert: | 1772 | err_fib_entry_insert: |
| 1773 | mlxsw_sp_router_fib4_entry_fini(mlxsw_sp, fib_entry); | ||
| 775 | mlxsw_sp_fib_entry_destroy(fib_entry); | 1774 | mlxsw_sp_fib_entry_destroy(fib_entry); |
| 776 | mlxsw_sp_vr_put(mlxsw_sp, vr); | 1775 | mlxsw_sp_vr_put(mlxsw_sp, vr); |
| 777 | return err; | 1776 | return err; |
| @@ -808,6 +1807,7 @@ int mlxsw_sp_router_fib4_del(struct mlxsw_sp_port *mlxsw_sp_port, | |||
| 808 | } | 1807 | } |
| 809 | mlxsw_sp_fib_entry_del(mlxsw_sp_port->mlxsw_sp, fib_entry); | 1808 | mlxsw_sp_fib_entry_del(mlxsw_sp_port->mlxsw_sp, fib_entry); |
| 810 | mlxsw_sp_fib_entry_remove(vr->fib, fib_entry); | 1809 | mlxsw_sp_fib_entry_remove(vr->fib, fib_entry); |
| 1810 | mlxsw_sp_router_fib4_entry_fini(mlxsw_sp, fib_entry); | ||
| 811 | mlxsw_sp_fib_entry_destroy(fib_entry); | 1811 | mlxsw_sp_fib_entry_destroy(fib_entry); |
| 812 | mlxsw_sp_vr_put(mlxsw_sp, vr); | 1812 | mlxsw_sp_vr_put(mlxsw_sp, vr); |
| 813 | return 0; | 1813 | return 0; |
