1
1
openwrt/target/linux/realtek/files-6.18/drivers/net/dsa/rtl83xx/common.c
Jonas Jelonek a4965dbf48
realtek: migrate PCS to fwnode_pcs provider/consumer API
PCS driver registers each SerDes as an fwnode_pcs provider in probe;
the resolver returns the cached or freshly-allocated rtpcs_link for
the requested (sds, link_idx) cell. DSA glue stops calling
rtpcs_create directly, drops .mac_select_pcs, and instead populates
phylink_config.num_available_pcs / fill_available_pcs from each
port's pcs-handle in phylink_get_caps. The rtl838x_port.pcs pointer
becomes a has_pcs bool populated at port probe via fwnode_property_
present, since nothing assigns the actual phylink_pcs anymore but the
"does this port use a PCS?" checks elsewhere still need a presence
flag.

Without .mac_select_pcs, phylink_major_config only searches the
pcs_list when state->interface is set in phylink_config.pcs_interfaces
(drivers/net/phy/phylink.c:1378). Populate it per port whenever the
port has a pcs-handle, listing the SerDes-routable interface modes for
each SoC variant -- without this, pcs_config / pcs_link_up are never
called and the SerDes is left unconfigured.

pcs_get_state still needs the MAC port number to index per-port link
status registers. Recover it at probe via rtpcs_map_links: walk the
sibling switch's ethernet-ports subtree (same backwards topology
lookup the sibling MDIO driver does for phy-handle), and for every
port whose pcs-handle resolves to one of our SerDes, store the port's
reg in sds->link_port[]. The resolver consults link_port[] when
allocating rtpcs_link and fails with -ENODEV if a consumer requested
a link the map step didn't record. Avoids a driver-side port_base
table that would have to encode per-SoC SerDes-to-port wiring (and
would silently break on non-contiguous variants); the DT is the
single source of truth.

Kconfig selects FWNODE_PCS.

Assisted-by: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
Link: https://github.com/openwrt/openwrt/pull/23539
Signed-off-by: Jonas Jelonek <jelonek.jonas@gmail.com>
2026-05-31 12:52:41 +02:00

1810 lines
48 KiB
C

// SPDX-License-Identifier: GPL-2.0-only
#include <linux/of_mdio.h>
#include <linux/of_platform.h>
#include <net/arp.h>
#include <net/nexthop.h>
#include <net/neighbour.h>
#include <net/netevent.h>
#include <linux/etherdevice.h>
#include <linux/if_vlan.h>
#include <linux/inetdevice.h>
#include <linux/platform_device.h>
#include <linux/rhashtable.h>
#include <linux/of_net.h>
#include <asm/mach-rtl-otto/mach-rtl-otto.h>
#include "rtl-otto.h"
struct phylink_pcs *rtpcs_create(struct device *dev, struct device_node *np, int link_idx, int port);
int rtldsa_port_get_stp_state(struct rtl838x_switch_priv *priv, int port)
{
u32 msti = 0;
int state;
if (port >= priv->r->cpu_port)
return -EINVAL;
mutex_lock(&priv->reg_mutex);
state = priv->r->stp_get(priv, msti, port);
mutex_unlock(&priv->reg_mutex);
return state;
}
static struct table_reg rtl838x_tbl_regs[] = {
TBL_DESC(0x6900, 0x6908, 3, 15, 13, 1), /* RTL8380_TBL_L2 */
TBL_DESC(0x6914, 0x6918, 18, 14, 12, 1), /* RTL8380_TBL_0 */
TBL_DESC(0xA4C8, 0xA4CC, 6, 14, 12, 1), /* RTL8380_TBL_1 */
TBL_DESC(0x1180, 0x1184, 3, 16, 14, 0), /* RTL8390_TBL_L2 */
TBL_DESC(0x1190, 0x1194, 17, 15, 12, 0), /* RTL8390_TBL_0 */
TBL_DESC(0x6B80, 0x6B84, 4, 14, 12, 0), /* RTL8390_TBL_1 */
TBL_DESC(0x611C, 0x6120, 9, 8, 6, 0), /* RTL8390_TBL_2 */
TBL_DESC(0xB320, 0xB334, 3, 18, 16, 0), /* RTL9300_TBL_L2 */
TBL_DESC(0xB340, 0xB344, 19, 16, 12, 0), /* RTL9300_TBL_0 */
TBL_DESC(0xB3A0, 0xB3A4, 20, 16, 13, 0), /* RTL9300_TBL_1 */
TBL_DESC(0xCE04, 0xCE08, 6, 14, 12, 0), /* RTL9300_TBL_2 */
TBL_DESC(0xD600, 0xD604, 30, 7, 6, 0), /* RTL9300_TBL_HSB */
TBL_DESC(0x7880, 0x7884, 22, 9, 8, 0), /* RTL9300_TBL_HSA */
TBL_DESC(0x8500, 0x8508, 8, 19, 15, 0), /* RTL9310_TBL_0 */
TBL_DESC(0x40C0, 0x40C4, 22, 16, 14, 0), /* RTL9310_TBL_1 */
TBL_DESC(0x8528, 0x852C, 6, 18, 14, 0), /* RTL9310_TBL_2 */
TBL_DESC(0x0200, 0x0204, 9, 15, 12, 0), /* RTL9310_TBL_3 */
TBL_DESC(0x20dc, 0x20e0, 29, 7, 6, 0), /* RTL9310_TBL_4 */
TBL_DESC(0x7e1c, 0x7e20, 53, 8, 6, 0), /* RTL9310_TBL_5 */
};
void rtl_table_init(void)
{
for (int i = 0; i < RTL_TBL_END; i++)
mutex_init(&rtl838x_tbl_regs[i].lock);
}
/* Request access to table t in table access register r
* Returns a handle to a lock for that table
*/
struct table_reg *rtl_table_get(rtl838x_tbl_reg_t r, int t)
{
if (r >= RTL_TBL_END)
return NULL;
if (t >= BIT(rtl838x_tbl_regs[r].c_bit - rtl838x_tbl_regs[r].t_bit))
return NULL;
mutex_lock(&rtl838x_tbl_regs[r].lock);
rtl838x_tbl_regs[r].tbl = t;
return &rtl838x_tbl_regs[r];
}
/* Release a table r, unlock the corresponding lock */
void rtl_table_release(struct table_reg *r)
{
if (!r)
return;
/* pr_info("Unlocking %08x\n", (u32)r); */
mutex_unlock(&r->lock);
/* pr_info("Unlock done\n"); */
}
static int rtl_table_exec(struct table_reg *r, bool is_write, int idx)
{
int ret = 0;
u32 cmd, val;
/* Read/write bit has inverted meaning on RTL838x */
if (r->rmode)
cmd = is_write ? 0 : BIT(r->c_bit);
else
cmd = is_write ? BIT(r->c_bit) : 0;
cmd |= BIT(r->c_bit + 1); /* Execute bit */
cmd |= r->tbl << r->t_bit; /* Table type */
cmd |= idx & (BIT(r->t_bit) - 1); /* Index */
sw_w32(cmd, r->addr);
ret = readx_poll_timeout(sw_r32, r->addr, val,
!(val & BIT(r->c_bit + 1)), 20, 10000);
if (ret)
pr_err("%s: timeout\n", __func__);
return ret;
}
/* Reads table index idx into the data registers of the table */
int rtl_table_read(struct table_reg *r, int idx)
{
return rtl_table_exec(r, false, idx);
}
/* Writes the content of the table data registers into the table at index idx */
int rtl_table_write(struct table_reg *r, int idx)
{
return rtl_table_exec(r, true, idx);
}
/* Returns the address of the ith data register of table register r
* the address is relative to the beginning of the Switch-IO block at 0xbb000000
*/
inline u16 rtl_table_data(struct table_reg *r, int i)
{
if (i >= r->max_data)
i = r->max_data - 1;
return r->data + i * 4;
}
inline u32 rtl_table_data_r(struct table_reg *r, int i)
{
return sw_r32(rtl_table_data(r, i));
}
inline void rtl_table_data_w(struct table_reg *r, u32 v, int i)
{
sw_w32(v, rtl_table_data(r, i));
}
/* Port register accessor functions for the RTL838x and RTL930X SoCs */
void rtl838x_mask_port_reg(u64 clear, u64 set, int reg)
{
sw_w32_mask((u32)clear, (u32)set, reg);
}
void rtl838x_set_port_reg(u64 set, int reg)
{
sw_w32((u32)set, reg);
}
u64 rtl838x_get_port_reg(int reg)
{
return ((u64)sw_r32(reg));
}
/* Port register accessor functions for the RTL839x and RTL931X SoCs */
void rtl839x_mask_port_reg_be(u64 clear, u64 set, int reg)
{
sw_w32_mask((u32)(clear >> 32), (u32)(set >> 32), reg);
sw_w32_mask((u32)(clear & 0xffffffff), (u32)(set & 0xffffffff), reg + 4);
}
u64 rtl839x_get_port_reg_be(int reg)
{
u64 v = sw_r32(reg);
v <<= 32;
v |= sw_r32(reg + 4);
return v;
}
void rtl839x_set_port_reg_be(u64 set, int reg)
{
sw_w32(set >> 32, reg);
sw_w32(set & 0xffffffff, reg + 4);
}
void rtl839x_mask_port_reg_le(u64 clear, u64 set, int reg)
{
sw_w32_mask((u32)clear, (u32)set, reg);
sw_w32_mask((u32)(clear >> 32), (u32)(set >> 32), reg + 4);
}
void rtl839x_set_port_reg_le(u64 set, int reg)
{
sw_w32(set, reg);
sw_w32(set >> 32, reg + 4);
}
u64 rtl839x_get_port_reg_le(int reg)
{
u64 v = sw_r32(reg + 4);
v <<= 32;
v |= sw_r32(reg);
return v;
}
static bool rtldsa_phy_load_deferred(struct phy_device *phydev)
{
struct device *d = &phydev->mdio.dev;
if (d->driver)
return false;
return driver_deferred_probe_check_state(d) == -EPROBE_DEFER;
}
static bool rtldsa_phys_load_deferred(void)
{
struct device_node *phy_node;
struct phy_device *phydev;
struct device_node *dn;
bool deferred;
for_each_node_by_name(dn, "port") {
if (!of_device_is_available(dn))
continue;
phy_node = of_parse_phandle(dn, "phy-handle", 0);
if (!phy_node)
continue;
phydev = of_phy_find_device(phy_node);
of_node_put(phy_node);
if (!phydev)
continue;
deferred = rtldsa_phy_load_deferred(phydev);
put_device(&phydev->mdio.dev);
if (deferred) {
of_node_put(dn);
return true;
}
}
return false;
}
static int rtl83xx_mdio_probe(struct rtl838x_switch_priv *priv)
{
struct device_node *dn, *phy_node, *led_node;
u32 pn;
/* Check if all busses of Realtek mdio controller are registered */
dn = of_find_compatible_node(NULL, NULL, "realtek,otto-mdio");
if (!of_device_is_available(dn)) {
of_node_put(dn);
return -ENODEV;
}
for_each_child_of_node_scoped(dn, bn) {
struct mii_bus *bus = of_mdio_find_bus(bn);
if (!bus) {
of_node_put(dn);
return -EPROBE_DEFER;
}
put_device(&bus->dev);
}
of_node_put(dn);
dn = of_find_compatible_node(NULL, NULL, "realtek,otto-switch");
if (!dn) {
dev_err(priv->dev, "No RTL switch node in DTS\n");
return -ENODEV;
}
led_node = of_find_compatible_node(NULL, NULL, "realtek,rtl9300-leds");
for_each_node_by_name(dn, "port") {
u32 led_set;
char led_set_str[16] = {0};
if (!of_device_is_available(dn))
continue;
if (of_property_read_u32(dn, "reg", &pn))
continue;
phy_node = of_parse_phandle(dn, "phy-handle", 0);
priv->ports[pn].has_pcs = fwnode_property_present(of_fwnode_handle(dn),
"pcs-handle");
if (pn != priv->r->cpu_port && !phy_node && !priv->ports[pn].has_pcs) {
dev_err(priv->dev, "Port node %d has neither pcs-handle nor phy-handle\n", pn);
continue;
}
priv->ports[pn].leds_on_this_port = 0;
if (led_node) {
if (of_property_read_u32(dn, "led-set", &led_set))
led_set = 0;
priv->ports[pn].led_set = led_set;
sprintf(led_set_str, "led_set%d", led_set);
priv->ports[pn].leds_on_this_port = of_property_count_u32_elems(led_node, led_set_str);
if (priv->ports[pn].leds_on_this_port > 4) {
of_node_put(dn);
dev_err(priv->dev, "led_set %d for port %d configuration is invalid\n", led_set, pn);
return -ENODEV;
}
}
priv->ports[pn].phy = !!phy_node;
}
/* Disable MAC polling the PHY so that we can start configuration */
priv->r->set_port_reg_le(0ULL, priv->r->smi_poll_ctrl);
/* Disable PHY polling via SoC */
if (priv->family_id == RTL8390_FAMILY_ID)
sw_w32_mask(BIT(7), 0, RTL839X_SMI_GLB_CTRL);
return 0;
}
static int rtl83xx_get_l2aging(struct rtl838x_switch_priv *priv)
{
int t = sw_r32(priv->r->l2_ctrl_1);
t &= priv->family_id == RTL8380_FAMILY_ID ? 0x7fffff : 0x1FFFFF;
if (priv->family_id == RTL8380_FAMILY_ID)
t = t * 128 / 625; /* Aging time in seconds. 0: L2 aging disabled */
else
t = (t * 3) / 5;
pr_debug("L2 AGING time: %d sec\n", t);
pr_debug("Dynamic aging for ports: %x\n", sw_r32(priv->r->l2_port_aging_out));
return t;
}
/* Caller must hold priv->reg_mutex */
int rtl83xx_lag_add(struct dsa_switch *ds, int group, int port, struct netdev_lag_upper_info *info)
{
struct rtl838x_switch_priv *priv = ds->priv;
int ret;
int i;
for (i = 0; i < priv->ds->num_lag_ids; i++) {
if (priv->lags_port_members[i] & BIT_ULL(port))
break;
}
if (i != priv->ds->num_lag_ids) {
pr_err("%s: Port %d already member of LAG %d.\n", __func__, port, i);
return -ENOSPC;
}
if (priv->r->lag_setup_algomask) {
ret = priv->r->lag_setup_algomask(priv, group, info);
if (ret)
return ret;
}
ret = priv->r->lag_set_port_members(priv, group,
priv->lags_port_members[group] | BIT_ULL(port), info);
if (ret)
return ret;
pr_info("%s: Added port %d to LAG %d. Members now %016llx.\n",
__func__, port, group, priv->lags_port_members[group]);
return 0;
}
/* Caller must hold priv->reg_mutex */
int rtl83xx_lag_del(struct dsa_switch *ds, int group, int port)
{
struct rtl838x_switch_priv *priv = ds->priv;
int ret;
if (group >= priv->ds->num_lag_ids) {
pr_err("%s: LAG %d invalid.\n", __func__, group);
return -EINVAL;
}
if (!(priv->lags_port_members[group] & BIT_ULL(port))) {
pr_err("%s: Port %d not member of LAG %d.\n", __func__, port, group);
return -ENOSPC;
}
/* Don't touch hash mask bits, as only the port might be removed from
* the LAG group. This means the lag group stays valid with existing
* mask algo bits. If there are no lag members left, then
* rtl83xx_lag_add will reconfigure hash mask when new LAG group is
* created.
*/
ret = priv->r->lag_set_port_members(priv, group,
priv->lags_port_members[group] & ~BIT_ULL(port),
NULL);
if (ret)
return ret;
pr_info("%s: Removed port %d from LAG %d. Members now %016llx.\n",
__func__, port, group, priv->lags_port_members[group]);
return 0;
}
int rtldsa_93xx_lag_set_distribution_algorithm(struct rtl838x_switch_priv *priv,
int group, int algoidx, u32 algomsk)
{
bool is_l3 = false;
u32 newmask = 0;
if (algomsk & TRUNK_DISTRIBUTION_ALGO_SIP_BIT) {
is_l3 = true;
newmask |= TRUNK_DISTRIBUTION_ALGO_L3_SIP_BIT;
}
if (algomsk & TRUNK_DISTRIBUTION_ALGO_DIP_BIT) {
is_l3 = true;
newmask |= TRUNK_DISTRIBUTION_ALGO_L3_DIP_BIT;
}
if (algomsk & TRUNK_DISTRIBUTION_ALGO_SRC_L4PORT_BIT) {
is_l3 = true;
newmask |= TRUNK_DISTRIBUTION_ALGO_L3_SRC_L4PORT_BIT;
}
if (algomsk & TRUNK_DISTRIBUTION_ALGO_DST_L4PORT_BIT) {
is_l3 = true;
newmask |= TRUNK_DISTRIBUTION_ALGO_L3_DST_L4PORT_BIT;
}
if (is_l3) {
if (algomsk & TRUNK_DISTRIBUTION_ALGO_SPA_BIT)
newmask |= TRUNK_DISTRIBUTION_ALGO_L3_SPA_BIT;
if (algomsk & TRUNK_DISTRIBUTION_ALGO_SMAC_BIT)
newmask |= TRUNK_DISTRIBUTION_ALGO_L3_SMAC_BIT;
if (algomsk & TRUNK_DISTRIBUTION_ALGO_DMAC_BIT)
newmask |= TRUNK_DISTRIBUTION_ALGO_L3_DMAC_BIT;
if (algomsk & TRUNK_DISTRIBUTION_ALGO_VLAN_BIT)
newmask |= TRUNK_DISTRIBUTION_ALGO_L3_VLAN_BIT;
} else {
if (algomsk & TRUNK_DISTRIBUTION_ALGO_SPA_BIT)
newmask |= TRUNK_DISTRIBUTION_ALGO_L2_SPA_BIT;
if (algomsk & TRUNK_DISTRIBUTION_ALGO_SMAC_BIT)
newmask |= TRUNK_DISTRIBUTION_ALGO_L2_SMAC_BIT;
if (algomsk & TRUNK_DISTRIBUTION_ALGO_DMAC_BIT)
newmask |= TRUNK_DISTRIBUTION_ALGO_L2_DMAC_BIT;
if (algomsk & TRUNK_DISTRIBUTION_ALGO_VLAN_BIT)
newmask |= TRUNK_DISTRIBUTION_ALGO_L2_VLAN_BIT;
}
sw_w32(newmask, priv->r->trk_hash_ctrl + (algoidx << 2));
return 0;
}
int rtldsa_83xx_lag_setup_algomask(struct rtl838x_switch_priv *priv, int group,
struct netdev_lag_upper_info *info)
{
u32 algomsk = 0;
u32 algoidx = 0;
switch (info->hash_type) {
case NETDEV_LAG_HASH_L2:
algomsk |= TRUNK_DISTRIBUTION_ALGO_DMAC_BIT;
algomsk |= TRUNK_DISTRIBUTION_ALGO_SMAC_BIT;
break;
case NETDEV_LAG_HASH_L23:
algomsk |= TRUNK_DISTRIBUTION_ALGO_DMAC_BIT;
algomsk |= TRUNK_DISTRIBUTION_ALGO_SMAC_BIT;
algomsk |= TRUNK_DISTRIBUTION_ALGO_SIP_BIT; /* source ip */
algomsk |= TRUNK_DISTRIBUTION_ALGO_DIP_BIT; /* dest ip */
algoidx = 1;
break;
case NETDEV_LAG_HASH_L34:
algomsk |= TRUNK_DISTRIBUTION_ALGO_SRC_L4PORT_BIT; /* sport */
algomsk |= TRUNK_DISTRIBUTION_ALGO_DST_L4PORT_BIT; /* dport */
algomsk |= TRUNK_DISTRIBUTION_ALGO_SIP_BIT; /* source ip */
algomsk |= TRUNK_DISTRIBUTION_ALGO_DIP_BIT; /* dest ip */
algoidx = 2;
break;
default:
algomsk |= TRUNK_DISTRIBUTION_ALGO_MASKALL;
}
return priv->r->lag_set_distribution_algorithm(priv, group, algoidx, algomsk);
}
static int rtldsa_93xx_lag_set_group2ports(struct rtl838x_switch_priv *priv, int group,
struct netdev_lag_upper_info *info)
{
DECLARE_BITMAP(ports, ARRAY_SIZE(priv->ports));
struct rtldsa_93xx_lag_entry e;
unsigned int table_pos = 0;
u8 num_of_lag_ports = 0;
u8 group_ports[8];
u32 data[3];
int i;
/* Read lag table using Table control register 2 */
struct table_reg *r = priv->r->lag_table();
rtl_table_read(r, group);
bitmap_clear(ports, 0, ARRAY_SIZE(priv->ports));
bitmap_from_arr64(ports, &priv->lags_port_members[group],
ARRAY_SIZE(priv->ports));
for (i = 0; i < 3; i++)
data[i] = sw_r32(rtl_table_data(r, i));
priv->r->lag_fill_data(data, &e);
num_of_lag_ports = bitmap_weight(ports, ARRAY_SIZE(priv->ports));
if (num_of_lag_ports > ARRAY_SIZE(group_ports)) {
pr_err("%s: Number of LAG ports too high: %u", __func__,
num_of_lag_ports);
return -ENOSPC;
}
memset(group_ports, 0x3f, sizeof(group_ports));
table_pos = 0;
for_each_set_bit(i, ports, ARRAY_SIZE(priv->ports)) {
if (!priv->ports[i].dp->lag_tx_enabled)
continue;
group_ports[table_pos] = i;
table_pos++;
}
/* Remove tx disabled ports */
num_of_lag_ports = table_pos;
e.trk_dev0 = 0;
e.trk_port0 = group_ports[0];
e.trk_dev1 = 0;
e.trk_port1 = group_ports[1];
e.trk_dev2 = 0;
e.trk_port2 = group_ports[2];
e.trk_dev3 = 0;
e.trk_port3 = group_ports[3];
e.trk_dev4 = 0;
e.trk_port4 = group_ports[4];
e.trk_dev5 = 0;
e.trk_port5 = group_ports[5];
e.trk_dev6 = 0;
e.trk_port6 = group_ports[6];
e.trk_dev7 = 0;
e.trk_port7 = group_ports[7];
e.num_tx_candi = num_of_lag_ports;
/* set hash_mask_idx to 0 if we are deleting lag group */
if (info) {
if (info->hash_type == NETDEV_LAG_HASH_L2) {
e.l2_hash_mask_idx = RTL93XX_HASH_MASK_INDEX_L2;
e.ip4_hash_mask_idx = RTL93XX_HASH_MASK_INDEX_L2;
e.ip6_hash_mask_idx = RTL93XX_HASH_MASK_INDEX_L2;
} else if (info->hash_type == NETDEV_LAG_HASH_L23) {
e.l2_hash_mask_idx = RTL93XX_HASH_MASK_INDEX_L23;
e.ip4_hash_mask_idx = RTL93XX_HASH_MASK_INDEX_L23;
e.ip6_hash_mask_idx = RTL93XX_HASH_MASK_INDEX_L23;
} else {
return -EOPNOTSUPP;
}
}
priv->r->lag_write_data(data, &e);
for (i = 0; i < 3; i++)
sw_w32(data[i], rtl_table_data(r, i));
rtl_table_write(r, group);
rtl_table_release(r);
return 0;
}
static inline void rtldsa_93xx_lag_set_local_group2ports(struct rtl838x_switch_priv *priv, int group,
u64 ports)
{
priv->r->set_port_reg_be(ports, priv->r->trk_mbr_ctr(group));
}
int rtldsa_93xx_lag_set_port_members(struct rtl838x_switch_priv *priv, int group,
u64 members, struct netdev_lag_upper_info *info)
{
DECLARE_BITMAP(affected_members, ARRAY_SIZE(priv->ports));
bool valid_group;
u64 old_members;
u64 affected;
size_t port;
int ret;
/* calculate modifications of the LAG group */
old_members = priv->lags_port_members[group];
priv->lags_port_members[group] = members;
affected = old_members | priv->lags_port_members[group];
bitmap_clear(affected_members, 0, ARRAY_SIZE(priv->ports));
bitmap_from_arr64(affected_members, &affected, BITS_PER_TYPE(affected));
valid_group = __sw_hweight64(priv->lags_port_members[group]);
/* apply global group and port settings */
ret = rtldsa_93xx_lag_set_group2ports(priv, group, info);
if (ret)
return ret;
for_each_set_bit(port, affected_members, ARRAY_SIZE(priv->ports)) {
bool valid = priv->lags_port_members[group] & BIT_ULL(port);
priv->r->lag_set_port2group(group, port, valid);
}
/* apply local group and port settings */
priv->r->lag_set_local_group_id(group, group, valid_group);
rtldsa_93xx_lag_set_local_group2ports(priv, group, priv->lags_port_members[group]);
for_each_set_bit(port, affected_members, ARRAY_SIZE(priv->ports)) {
bool valid = priv->lags_port_members[group] & BIT_ULL(port);
priv->r->lag_set_local_port2group(group, port, valid);
}
/* write lag table (and maybe additional information) to SRAM */
priv->r->lag_sync_tables();
return 0;
}
// Currently Unused
// /* Allocate a 64 bit octet counter located in the LOG HW table */
// static int rtl83xx_octet_cntr_alloc(struct rtl838x_switch_priv *priv)
// {
// int idx;
// mutex_lock(&priv->reg_mutex);
// idx = find_first_zero_bit(priv->octet_cntr_use_bm, MAX_COUNTERS);
// if (idx >= priv->r->n_counters) {
// mutex_unlock(&priv->reg_mutex);
// return -1;
// }
// set_bit(idx, priv->octet_cntr_use_bm);
// mutex_unlock(&priv->reg_mutex);
// return idx;
// }
/* Allocate a 32-bit packet counter
* 2 32-bit packet counters share the location of a 64-bit octet counter
* Initially there are no free packet counters and 2 new ones need to be freed
* by allocating the corresponding octet counter
*/
int rtl83xx_packet_cntr_alloc(struct rtl838x_switch_priv *priv)
{
int idx, j;
mutex_lock(&priv->reg_mutex);
/* Because initially no packet counters are free, the logic is reversed:
* a 0-bit means the counter is already allocated (for octets)
*/
idx = find_first_bit(priv->packet_cntr_use_bm, MAX_COUNTERS * 2);
if (idx >= priv->r->n_counters * 2) {
j = find_first_zero_bit(priv->octet_cntr_use_bm, MAX_COUNTERS);
if (j >= priv->r->n_counters) {
mutex_unlock(&priv->reg_mutex);
return -1;
}
set_bit(j, priv->octet_cntr_use_bm);
idx = j * 2;
set_bit(j * 2 + 1, priv->packet_cntr_use_bm);
} else {
clear_bit(idx, priv->packet_cntr_use_bm);
}
mutex_unlock(&priv->reg_mutex);
return idx;
}
/* Add an L2 nexthop entry for the L3 routing system / PIE forwarding in the SoC
* Use VID and MAC in rtl838x_l2_entry to identify either a free slot in the L2 hash table
* or mark an existing entry as a nexthop by setting it's nexthop bit
* Called from the L3 layer
* The index in the L2 hash table is filled into nh->l2_id;
*/
static int rtl83xx_l2_nexthop_add(struct rtl838x_switch_priv *priv, struct rtl83xx_nexthop *nh)
{
struct rtl838x_l2_entry e;
u64 seed = priv->r->l2_hash_seed(nh->mac, nh->rvid);
u32 key = priv->r->l2_hash_key(priv, seed);
int idx = -1;
u64 entry;
pr_debug("%s searching for %08llx vid %d with key %d, seed: %016llx\n",
__func__, nh->mac, nh->rvid, key, seed);
e.type = L2_UNICAST;
u64_to_ether_addr(nh->mac, &e.mac[0]);
e.port = nh->port;
/* Loop over all entries in the hash-bucket and over the second block on 93xx SoCs */
for (int i = 0; i < priv->r->l2_bucket_size; i++) {
entry = priv->r->read_l2_entry_using_hash(key, i, &e);
if (!e.valid || ((entry & 0x0fffffffffffffffULL) == seed)) {
idx = i > 3 ? ((key >> 14) & 0xffff) | i >> 1
: ((key << 2) | i) & 0xffff;
break;
}
}
if (idx < 0) {
pr_err("%s: No more L2 forwarding entries available\n", __func__);
return -1;
}
/* Found an existing (e->valid is true) or empty entry, make it a nexthop entry */
nh->l2_id = idx;
if (e.valid) {
nh->port = e.port;
nh->vid = e.vid; /* Save VID */
nh->rvid = e.rvid;
nh->dev_id = e.stack_dev;
/* If the entry is already a valid next hop entry, don't change it */
if (e.next_hop)
return 0;
} else {
e.valid = true;
e.is_static = true;
e.rvid = nh->rvid;
e.is_ip_mc = false;
e.is_ipv6_mc = false;
e.block_da = false;
e.block_sa = false;
e.suspended = false;
e.age = 0; /* With port-ignore */
e.port = priv->r->port_ignore;
u64_to_ether_addr(nh->mac, &e.mac[0]);
}
e.next_hop = true;
e.nh_route_id = nh->id; /* NH route ID takes place of VID */
e.nh_vlan_target = false;
priv->r->write_l2_entry_using_hash(idx >> 2, idx & 0x3, &e);
return 0;
}
/* Removes a Layer 2 next hop entry in the forwarding database
* If it was static, the entire entry is removed, otherwise the nexthop bit is cleared
* and we wait until the entry ages out
*/
static int rtl83xx_l2_nexthop_rm(struct rtl838x_switch_priv *priv, struct rtl83xx_nexthop *nh)
{
struct rtl838x_l2_entry e;
u32 key = nh->l2_id >> 2;
int i = nh->l2_id & 0x3;
u64 entry = entry = priv->r->read_l2_entry_using_hash(key, i, &e);
pr_debug("%s: id %d, key %d, index %d\n", __func__, nh->l2_id, key, i);
if (!e.valid) {
dev_err(priv->dev, "unknown nexthop, id %x\n", nh->l2_id);
return -1;
}
if (e.is_static)
e.valid = false;
e.next_hop = false;
e.vid = nh->vid; /* Restore VID */
e.rvid = nh->rvid;
priv->r->write_l2_entry_using_hash(key, i, &e);
return 0;
}
int rtl83xx_port_is_under(const struct net_device *dev, struct rtl838x_switch_priv *priv)
{
/* Is the lower network device a DSA user network device of our RTL930X-switch?
* Unfortunately we cannot just follow dev->dsa_prt as this is only set for the
* DSA conduit device. TODO: since 6.12:
*
* if(!dsa_user_dev_check(dev)) {
* netdev_info(dev, "%s: not a DSA device.\n", __func__);
* return -EINVAL;
* }
*/
for (int i = 0; i < priv->r->cpu_port; i++) {
if (!priv->ports[i].dp)
continue;
if (priv->ports[i].dp->user == dev)
return i;
}
return -EINVAL;
}
static const struct rhashtable_params route_ht_params = {
.key_len = sizeof(u32),
.key_offset = offsetof(struct rtl83xx_route, gw_ip),
.head_offset = offsetof(struct rtl83xx_route, linkage),
};
/* Updates an L3 next hop entry in the ROUTING table */
static int rtl83xx_l3_nexthop_update(struct rtl838x_switch_priv *priv, __be32 ip_addr, u64 mac)
{
struct rtl83xx_route *r;
struct rhlist_head *tmp, *list;
rcu_read_lock();
list = rhltable_lookup(&priv->routes, &ip_addr, route_ht_params);
if (!list) {
rcu_read_unlock();
return -ENOENT;
}
rhl_for_each_entry_rcu(r, tmp, list, linkage) {
pr_debug("%s: Setting up fwding: ip %pI4, GW mac %016llx\n",
__func__, &ip_addr, mac);
/* Reads the ROUTING table entry associated with the route */
priv->r->route_read(r->id, r);
pr_debug("Route with id %d to %pI4 / %d\n", r->id, &r->dst_ip, r->prefix_len);
r->nh.mac = r->nh.gw = mac;
r->nh.port = priv->r->port_ignore;
r->nh.id = r->id;
/* Do we need to explicitly add a DMAC entry with the route's nh index? */
if (priv->r->set_l3_egress_mac)
priv->r->set_l3_egress_mac(r->id, mac);
/* Update ROUTING table: map gateway-mac and switch-mac id to route id */
rtl83xx_l2_nexthop_add(priv, &r->nh);
r->attr.valid = true;
r->attr.action = ROUTE_ACT_FORWARD;
r->attr.type = 0;
r->attr.hit = false; /* Reset route-used indicator */
/* Add PIE entry with dst_ip and prefix_len */
r->pr.dip = r->dst_ip;
r->pr.dip_m = inet_make_mask(r->prefix_len);
if (r->is_host_route) {
int slot = priv->r->find_l3_slot(r, false);
pr_info("%s: Got slot for route: %d\n", __func__, slot);
priv->r->host_route_write(slot, r);
} else {
priv->r->route_write(r->id, r);
r->pr.fwd_sel = true;
r->pr.fwd_data = r->nh.l2_id;
r->pr.fwd_act = PIE_ACT_ROUTE_UC;
}
if (priv->r->set_l3_nexthop)
priv->r->set_l3_nexthop(r->nh.id, r->nh.l2_id, r->nh.if_id);
if (r->pr.id < 0) {
r->pr.packet_cntr = rtl83xx_packet_cntr_alloc(priv);
if (r->pr.packet_cntr >= 0) {
pr_info("Using packet counter %d\n", r->pr.packet_cntr);
r->pr.log_sel = true;
r->pr.log_data = r->pr.packet_cntr;
}
priv->r->pie_rule_add(priv, &r->pr);
} else {
int pkts = priv->r->packet_cntr_read(r->pr.packet_cntr);
pr_debug("%s: total packets: %d\n", __func__, pkts);
priv->r->pie_rule_write(priv, r->pr.id, &r->pr);
}
}
rcu_read_unlock();
return 0;
}
static int rtl83xx_port_ipv4_resolve(struct rtl838x_switch_priv *priv,
struct net_device *dev, __be32 ip_addr)
{
struct neighbour *n = neigh_lookup(&arp_tbl, &ip_addr, dev);
int err = 0;
u64 mac;
if (!n) {
n = neigh_create(&arp_tbl, &ip_addr, dev);
if (IS_ERR(n))
return PTR_ERR(n);
}
/* If the neigh is already resolved, then go ahead and
* install the entry, otherwise start the ARP process to
* resolve the neigh.
*/
if (n->nud_state & NUD_VALID) {
mac = ether_addr_to_u64(n->ha);
pr_info("%s: resolved mac: %016llx\n", __func__, mac);
rtl83xx_l3_nexthop_update(priv, ip_addr, mac);
} else {
pr_info("%s: need to wait\n", __func__);
neigh_event_send(n, NULL);
}
neigh_release(n);
return err;
}
struct rtl83xx_walk_data {
struct rtl838x_switch_priv *priv;
int port;
};
static int rtl83xx_port_lower_walk(struct net_device *lower, struct netdev_nested_priv *_priv)
{
struct rtl83xx_walk_data *data = (struct rtl83xx_walk_data *)_priv->data;
struct rtl838x_switch_priv *priv = data->priv;
int ret = 0;
int index;
index = rtl83xx_port_is_under(lower, priv);
data->port = index;
if (index >= 0) {
pr_debug("Found DSA-port, index %d\n", index);
ret = 1;
}
return ret;
}
static int rtl83xx_port_dev_lower_find(struct net_device *dev, struct rtl838x_switch_priv *priv)
{
struct rtl83xx_walk_data data;
struct netdev_nested_priv _priv;
data.priv = priv;
data.port = 0;
_priv.data = (void *)&data;
netdev_walk_all_lower_dev(dev, rtl83xx_port_lower_walk, &_priv);
return data.port;
}
static struct rtl83xx_route *rtl83xx_route_alloc(struct rtl838x_switch_priv *priv, u32 ip)
{
struct rtl83xx_route *r;
int idx = 0, err;
mutex_lock(&priv->reg_mutex);
idx = find_first_zero_bit(priv->route_use_bm, MAX_ROUTES);
pr_debug("%s id: %d, ip %pI4\n", __func__, idx, &ip);
r = kzalloc(sizeof(*r), GFP_KERNEL);
if (!r) {
mutex_unlock(&priv->reg_mutex);
return r;
}
r->id = idx;
r->gw_ip = ip;
r->pr.id = -1; /* We still need to allocate a rule in HW */
r->is_host_route = false;
err = rhltable_insert(&priv->routes, &r->linkage, route_ht_params);
if (err) {
pr_err("Could not insert new rule\n");
mutex_unlock(&priv->reg_mutex);
goto out_free;
}
set_bit(idx, priv->route_use_bm);
mutex_unlock(&priv->reg_mutex);
return r;
out_free:
kfree(r);
return NULL;
}
static struct rtl83xx_route *rtl83xx_host_route_alloc(struct rtl838x_switch_priv *priv, u32 ip)
{
struct rtl83xx_route *r;
int idx = 0, err;
mutex_lock(&priv->reg_mutex);
idx = find_first_zero_bit(priv->host_route_use_bm, MAX_HOST_ROUTES);
pr_debug("%s id: %d, ip %pI4\n", __func__, idx, &ip);
r = kzalloc(sizeof(*r), GFP_KERNEL);
if (!r) {
mutex_unlock(&priv->reg_mutex);
return r;
}
/* We require a unique route ID irrespective of whether it is a prefix or host
* route (on RTL93xx) as we use this ID to associate a DMAC and next-hop entry
*/
r->id = idx + MAX_ROUTES;
r->gw_ip = ip;
r->pr.id = -1; /* We still need to allocate a rule in HW */
r->is_host_route = true;
err = rhltable_insert(&priv->routes, &r->linkage, route_ht_params);
if (err) {
pr_err("Could not insert new rule\n");
mutex_unlock(&priv->reg_mutex);
goto out_free;
}
set_bit(idx, priv->host_route_use_bm);
mutex_unlock(&priv->reg_mutex);
return r;
out_free:
kfree(r);
return NULL;
}
static void rtl83xx_route_rm(struct rtl838x_switch_priv *priv, struct rtl83xx_route *r)
{
int id;
if (rhltable_remove(&priv->routes, &r->linkage, route_ht_params))
dev_warn(priv->dev, "Could not remove route\n");
if (r->is_host_route) {
id = priv->r->find_l3_slot(r, false);
pr_debug("%s: Got id for host route: %d\n", __func__, id);
r->attr.valid = false;
priv->r->host_route_write(id, r);
clear_bit(r->id - MAX_ROUTES, priv->host_route_use_bm);
} else {
/* If there is a HW representation of the route, delete it */
if (priv->r->route_lookup_hw) {
id = priv->r->route_lookup_hw(r);
pr_info("%s: Got id for prefix route: %d\n", __func__, id);
r->attr.valid = false;
priv->r->route_write(id, r);
}
clear_bit(r->id, priv->route_use_bm);
}
kfree(r);
}
static int rtldsa_fib4_check(struct rtl838x_switch_priv *priv,
struct fib_entry_notifier_info *info,
enum fib_event_type event)
{
struct net_device *ndev = fib_info_nh(info->fi, 0)->fib_nh_dev;
int vlan = is_vlan_dev(ndev) ? vlan_dev_vlan_id(ndev) : 0;
struct fib_nh *nh = fib_info_nh(info->fi, 0);
char gw_message[32] = "";
if (nh->fib_nh_gw4)
snprintf(gw_message, sizeof(gw_message), "via %pI4 ", &nh->fib_nh_gw4);
dev_info(priv->dev, "%s IPv4 route %pI4/%d %s(VLAN %d, MAC %pM)\n",
event == FIB_EVENT_ENTRY_ADD ? "add" : "delete",
&info->dst, info->dst_len, gw_message, vlan, ndev->dev_addr);
if ((info->type == RTN_BROADCAST) || ipv4_is_loopback(info->dst) || !info->dst) {
dev_warn(priv->dev, "skip loopback/broadcast addresses and default routes\n");
return -EINVAL;
}
return 0;
}
static int rtldsa_fib4_del(struct rtl838x_switch_priv *priv,
struct fib_entry_notifier_info *info)
{
struct fib_nh *nh = fib_info_nh(info->fi, 0);
struct rhlist_head *tmp, *list;
struct rtl83xx_route *route;
if (rtldsa_fib4_check(priv, info, FIB_EVENT_ENTRY_DEL))
return 0;
rcu_read_lock();
list = rhltable_lookup(&priv->routes, &nh->fib_nh_gw4, route_ht_params);
if (!list) {
rcu_read_unlock();
dev_err(priv->dev, "no such gateway: %pI4\n", &nh->fib_nh_gw4);
return -ENOENT;
}
rhl_for_each_entry_rcu(route, tmp, list, linkage) {
if (route->dst_ip == info->dst && route->prefix_len == info->dst_len) {
dev_info(priv->dev, "found a route with id %d, nh-id %d\n",
route->id, route->nh.id);
break;
}
}
rcu_read_unlock();
rtl83xx_l2_nexthop_rm(priv, &route->nh);
dev_info(priv->dev, "releasing packet counter %d\n", route->pr.packet_cntr);
set_bit(route->pr.packet_cntr, priv->packet_cntr_use_bm);
priv->r->pie_rule_rm(priv, &route->pr);
rtl83xx_route_rm(priv, route);
nh->fib_nh_flags &= ~RTNH_F_OFFLOAD;
return 0;
}
/* On the RTL93xx, an L3 termination endpoint MAC address on which the router waits
* for packets to be routed needs to be allocated.
*/
static int rtl83xx_alloc_router_mac(struct rtl838x_switch_priv *priv, u64 mac)
{
int free_mac = -1;
struct rtl93xx_rt_mac m;
mutex_lock(&priv->reg_mutex);
for (int i = 0; i < MAX_ROUTER_MACS; i++) {
priv->r->get_l3_router_mac(i, &m);
if (free_mac < 0 && !m.valid) {
free_mac = i;
continue;
}
if (m.valid && m.mac == mac) {
free_mac = i;
break;
}
}
if (free_mac < 0) {
pr_err("No free router MACs, cannot offload\n");
mutex_unlock(&priv->reg_mutex);
return -1;
}
m.valid = true;
m.mac = mac;
m.p_type = 0; /* An individual port, not a trunk port */
m.p_id = 0x3f; /* Listen on any port */
m.p_id_mask = 0;
m.vid = 0; /* Listen on any VLAN... */
m.vid_mask = 0; /* ... so mask needs to be 0 */
m.mac_mask = 0xffffffffffffULL; /* We want an exact match of the interface MAC */
m.action = L3_FORWARD; /* Route the packet */
priv->r->set_l3_router_mac(free_mac, &m);
mutex_unlock(&priv->reg_mutex);
return 0;
}
static int rtl83xx_alloc_egress_intf(struct rtl838x_switch_priv *priv, u64 mac, int vlan)
{
int free_mac = -1;
struct rtl838x_l3_intf intf;
u64 m;
mutex_lock(&priv->reg_mutex);
for (int i = 0; i < MAX_SMACS; i++) {
m = priv->r->get_l3_egress_mac(L3_EGRESS_DMACS + i);
if (free_mac < 0 && !m) {
free_mac = i;
continue;
}
if (m == mac) {
mutex_unlock(&priv->reg_mutex);
return i;
}
}
if (free_mac < 0) {
pr_err("No free egress interface, cannot offload\n");
return -1;
}
/* Set up default egress interface 1 */
intf.vid = vlan;
intf.smac_idx = free_mac;
intf.ip4_mtu_id = 1;
intf.ip6_mtu_id = 1;
intf.ttl_scope = 1; /* TTL */
intf.hl_scope = 1; /* Hop Limit */
intf.ip4_icmp_redirect = intf.ip6_icmp_redirect = 2; /* FORWARD */
intf.ip4_pbr_icmp_redirect = intf.ip6_pbr_icmp_redirect = 2; /* FORWARD; */
priv->r->set_l3_egress_intf(free_mac, &intf);
priv->r->set_l3_egress_mac(L3_EGRESS_DMACS + free_mac, mac);
mutex_unlock(&priv->reg_mutex);
return free_mac;
}
static int rtldsa_fib4_add(struct rtl838x_switch_priv *priv,
struct fib_entry_notifier_info *info)
{
struct net_device *ndev = fib_info_nh(info->fi, 0)->fib_nh_dev;
int vlan = is_vlan_dev(ndev) ? vlan_dev_vlan_id(ndev) : 0;
struct fib_nh *nh = fib_info_nh(info->fi, 0);
struct rtl83xx_route *route;
int port;
if (rtldsa_fib4_check(priv, info, FIB_EVENT_ENTRY_ADD))
return 0;
port = rtl83xx_port_dev_lower_find(ndev, priv);
if (port < 0) {
dev_err(priv->dev, "lower interface %s not found\n", ndev->name);
return -ENODEV;
}
/* Allocate route or host-route entry (if hardware supports this) */
if (info->dst_len == 32 && priv->r->host_route_write)
route = rtl83xx_host_route_alloc(priv, nh->fib_nh_gw4);
else
route = rtl83xx_route_alloc(priv, nh->fib_nh_gw4);
if (route)
dev_info(priv->dev, "route hashtable extended for gw %pI4\n", &nh->fib_nh_gw4);
else {
dev_err(priv->dev, "could not extend route hashtable for gw %pI4\n", &nh->fib_nh_gw4);
return -ENOSPC;
}
route->dst_ip = info->dst;
route->prefix_len = info->dst_len;
route->nh.rvid = vlan;
if (priv->r->set_l3_router_mac) {
u64 mac = ether_addr_to_u64(ndev->dev_addr);
pr_debug("Local route and router MAC %pM\n", ndev->dev_addr);
if (rtl83xx_alloc_router_mac(priv, mac))
goto out_free_rt;
/* vid = 0: Do not care about VID */
route->nh.if_id = rtl83xx_alloc_egress_intf(priv, mac, vlan);
if (route->nh.if_id < 0)
goto out_free_rmac;
if (!nh->fib_nh_gw4) {
int slot;
route->nh.mac = mac;
route->nh.port = priv->r->port_ignore;
route->attr.valid = true;
route->attr.action = ROUTE_ACT_TRAP2CPU;
route->attr.type = 0;
slot = priv->r->find_l3_slot(route, false);
pr_debug("%s: Got slot for route: %d\n", __func__, slot);
priv->r->host_route_write(slot, route);
}
}
/* We need to resolve the mac address of the GW */
if (nh->fib_nh_gw4)
rtl83xx_port_ipv4_resolve(priv, ndev, nh->fib_nh_gw4);
nh->fib_nh_flags |= RTNH_F_OFFLOAD;
return 0;
out_free_rmac:
out_free_rt:
return 0;
}
static int rtl83xx_fib6_add(struct rtl838x_switch_priv *priv,
struct fib6_entry_notifier_info *info)
{
pr_debug("In %s\n", __func__);
/* nh->fib_nh_flags |= RTNH_F_OFFLOAD; */
return 0;
}
struct net_event_work {
struct work_struct work;
struct rtl838x_switch_priv *priv;
u64 mac;
u32 gw_addr;
};
static void rtl83xx_net_event_work_do(struct work_struct *work)
{
struct net_event_work *net_work =
container_of(work, struct net_event_work, work);
struct rtl838x_switch_priv *priv = net_work->priv;
rtl83xx_l3_nexthop_update(priv, net_work->gw_addr, net_work->mac);
kfree(net_work);
}
static int rtl83xx_netevent_event(struct notifier_block *this,
unsigned long event, void *ptr)
{
struct rtl838x_switch_priv *priv;
struct net_device *dev;
struct neighbour *n = ptr;
int err, port;
struct net_event_work *net_work;
priv = container_of(this, struct rtl838x_switch_priv, ne_nb);
switch (event) {
case NETEVENT_NEIGH_UPDATE:
/* ignore events for HW with missing L3 offloading implementation */
if (!priv->r->l3_setup)
return NOTIFY_DONE;
if (n->tbl != &arp_tbl)
return NOTIFY_DONE;
dev = n->dev;
port = rtl83xx_port_dev_lower_find(dev, priv);
if (port < 0 || !(n->nud_state & NUD_VALID)) {
pr_debug("%s: Neigbour invalid, not updating\n", __func__);
return NOTIFY_DONE;
}
net_work = kzalloc(sizeof(*net_work), GFP_ATOMIC);
if (!net_work)
return NOTIFY_BAD;
INIT_WORK(&net_work->work, rtl83xx_net_event_work_do);
net_work->priv = priv;
net_work->mac = ether_addr_to_u64(n->ha);
net_work->gw_addr = *(__be32 *)n->primary_key;
pr_debug("%s: updating neighbour on port %d, mac %016llx\n",
__func__, port, net_work->mac);
queue_work(priv->wq, &net_work->work);
if (err)
netdev_warn(dev, "failed to handle neigh update (err %d)\n", err);
break;
}
return NOTIFY_DONE;
}
struct rtl83xx_fib_event_work {
struct work_struct work;
union {
struct fib_entry_notifier_info fen_info;
struct fib6_entry_notifier_info fen6_info;
struct fib_rule_notifier_info fr_info;
};
struct rtl838x_switch_priv *priv;
bool is_fib6;
unsigned long event;
};
static void rtl83xx_fib_event_work_do(struct work_struct *work)
{
struct rtl83xx_fib_event_work *fib_work =
container_of(work, struct rtl83xx_fib_event_work, work);
struct rtl838x_switch_priv *priv = fib_work->priv;
struct fib_rule *rule;
int err;
/* Protect internal structures from changes */
rtnl_lock();
pr_debug("%s: doing work, event %ld\n", __func__, fib_work->event);
switch (fib_work->event) {
case FIB_EVENT_ENTRY_ADD:
case FIB_EVENT_ENTRY_REPLACE:
case FIB_EVENT_ENTRY_APPEND:
if (fib_work->is_fib6)
err = rtl83xx_fib6_add(priv, &fib_work->fen6_info);
else
err = rtldsa_fib4_add(priv, &fib_work->fen_info);
if (err)
dev_err(priv->dev, "fib_add() failed\n");
fib_info_put(fib_work->fen_info.fi);
break;
case FIB_EVENT_ENTRY_DEL:
err = rtldsa_fib4_del(priv, &fib_work->fen_info);
if (err)
dev_err(priv->dev, "fib_del() failed\n");
fib_info_put(fib_work->fen_info.fi);
break;
case FIB_EVENT_RULE_ADD:
case FIB_EVENT_RULE_DEL:
rule = fib_work->fr_info.rule;
if (!fib4_rule_default(rule))
pr_err("%s: FIB4 default rule failed\n", __func__);
fib_rule_put(rule);
break;
}
rtnl_unlock();
kfree(fib_work);
}
/* Called with rcu_read_lock() */
static int rtl83xx_fib_event(struct notifier_block *this, unsigned long event, void *ptr)
{
struct fib_notifier_info *info = ptr;
struct rtl838x_switch_priv *priv;
struct rtl83xx_fib_event_work *fib_work;
if ((info->family != AF_INET && info->family != AF_INET6 &&
info->family != RTNL_FAMILY_IPMR &&
info->family != RTNL_FAMILY_IP6MR))
return NOTIFY_DONE;
priv = container_of(this, struct rtl838x_switch_priv, fib_nb);
/* ignore FIB events for HW with missing L3 offloading implementation */
if (!priv->r->l3_setup)
return NOTIFY_DONE;
fib_work = kzalloc(sizeof(*fib_work), GFP_ATOMIC);
if (!fib_work)
return NOTIFY_BAD;
INIT_WORK(&fib_work->work, rtl83xx_fib_event_work_do);
fib_work->priv = priv;
fib_work->event = event;
fib_work->is_fib6 = false;
switch (event) {
case FIB_EVENT_ENTRY_ADD:
case FIB_EVENT_ENTRY_REPLACE:
case FIB_EVENT_ENTRY_APPEND:
case FIB_EVENT_ENTRY_DEL:
pr_debug("%s: FIB_ENTRY ADD/DEL, event %ld\n", __func__, event);
if (info->family == AF_INET) {
struct fib_entry_notifier_info *fen_info = ptr;
if (fen_info->fi->fib_nh_is_v6) {
NL_SET_ERR_MSG_MOD(info->extack,
"IPv6 gateway with IPv4 route is not supported");
kfree(fib_work);
return notifier_from_errno(-EINVAL);
}
memcpy(&fib_work->fen_info, ptr, sizeof(fib_work->fen_info));
/* Take referece on fib_info to prevent it from being
* freed while work is queued. Release it afterwards.
*/
fib_info_hold(fib_work->fen_info.fi);
} else if (info->family == AF_INET6) {
//struct fib6_entry_notifier_info *fen6_info = ptr;
pr_warn("%s: FIB_RULE ADD/DEL for IPv6 not supported\n", __func__);
kfree(fib_work);
return NOTIFY_DONE;
}
break;
case FIB_EVENT_RULE_ADD:
case FIB_EVENT_RULE_DEL:
pr_debug("%s: FIB_RULE ADD/DEL, event: %ld\n", __func__, event);
memcpy(&fib_work->fr_info, ptr, sizeof(fib_work->fr_info));
fib_rule_get(fib_work->fr_info.rule);
break;
}
queue_work(priv->wq, &fib_work->work);
return NOTIFY_DONE;
}
static irqreturn_t rtldsa_switch_irq(int irq, void *dev_id)
{
struct rtl838x_switch_priv *priv;
struct dsa_switch *ds = dev_id;
u64 link, ports;
priv = ds->priv;
ports = priv->r->get_port_reg_le(priv->r->isr_port_link_sts_chg);
priv->r->set_port_reg_le(ports, priv->r->isr_port_link_sts_chg);
/* read latched */
link = priv->r->get_port_reg_le(priv->r->mac_link_sts);
link = priv->r->get_port_reg_le(priv->r->mac_link_sts);
for (int port = 0; port < priv->r->cpu_port; port++)
if (ports & BIT_ULL(port))
dsa_port_phylink_mac_change(ds, port, link & BIT_ULL(port));
return IRQ_HANDLED;
}
/*
* TODO: This check is usually built into the DSA initialization functions. After carving
* out the mdio driver from the ethernet driver, there are two drivers that must be loaded
* before the DSA setup can start. This driver has severe issues with handling of deferred
* probing. For now provide this function for early dependency checks.
*/
static int rtldsa_ethernet_loaded(struct platform_device *pdev)
{
struct platform_device *eth_pdev;
struct device_node *port_np;
struct device_node *eth_np;
int ret = -EPROBE_DEFER;
for_each_node_with_property(port_np, "ethernet") {
eth_np = of_parse_phandle(port_np, "ethernet", 0);
if (!eth_np)
continue;
eth_pdev = of_find_device_by_node(eth_np);
of_node_put(eth_np);
if (!eth_pdev)
continue;
if (eth_pdev->dev.driver)
ret = 0;
put_device(&eth_pdev->dev);
}
return ret;
}
static int rtl83xx_sw_probe(struct platform_device *pdev)
{
struct rtl838x_switch_priv *priv;
struct device *dev = &pdev->dev;
const struct rtldsa_config *r;
u64 bpdu_mask;
int err = 0;
pr_debug("Probing RTL838X switch device\n");
if (!pdev->dev.of_node) {
dev_err(dev, "No DT found\n");
return -EINVAL;
}
if (rtldsa_phys_load_deferred())
return -EPROBE_DEFER;
err = rtldsa_ethernet_loaded(pdev);
if (err)
return err;
/* Initialize access to RTL switch tables */
rtl_table_init();
r = device_get_match_data(&pdev->dev);
priv = devm_kzalloc(dev, struct_size(priv, msts, r->n_mst - 1), GFP_KERNEL);
if (!priv)
return -ENOMEM;
priv->r = r;
priv->ds = devm_kzalloc(dev, sizeof(*priv->ds), GFP_KERNEL);
if (!priv->ds)
return -ENOMEM;
priv->ds->dev = dev;
priv->ds->priv = priv;
priv->ds->needs_standalone_vlan_filtering = true;
priv->ds->ops = priv->r->switch_ops;
priv->ds->phylink_mac_ops = priv->r->phylink_mac_ops;
priv->ds->num_lag_ids = priv->r->num_lag_ids;
priv->ds->num_ports = priv->r->cpu_port + 1;
priv->dev = dev;
dev_set_drvdata(dev, priv);
err = devm_mutex_init(dev, &priv->reg_mutex);
if (err)
return err;
err = devm_mutex_init(dev, &priv->counters_lock);
if (err)
return err;
priv->family_id = soc_info.family;
sw_w32(0, priv->r->spanning_tree_ctrl);
priv->irq_mask = GENMASK_ULL(priv->r->cpu_port - 1, 0);
err = rtl83xx_mdio_probe(priv);
if (err) {
/* Probing fails the 1st time because of missing ethernet driver
* initialization. Use this to disable traffic in case the bootloader left if on
*/
return err;
}
priv->wq = create_singlethread_workqueue("rtl83xx");
if (!priv->wq) {
dev_err(dev, "Error creating workqueue: %d\n", err);
return -ENOMEM;
}
err = dsa_register_switch(priv->ds);
if (err) {
dev_err(dev, "Error registering switch: %d\n", err);
goto err_register_switch;
}
/* dsa_to_port returns dsa_port from the port list in
* dsa_switch_tree, the tree is built when the switch
* is registered by dsa_register_switch
*/
for (int i = 0; i <= priv->r->cpu_port; i++)
priv->ports[i].dp = dsa_to_port(priv->ds, i);
/* Enable link and media change interrupts. Are the SERDES masks needed? */
sw_w32_mask(0, 3, priv->r->isr_glb_src);
priv->r->set_port_reg_le(priv->irq_mask, priv->r->isr_port_link_sts_chg);
priv->r->set_port_reg_le(priv->irq_mask, priv->r->imr_port_link_sts_chg);
priv->link_state_irq = platform_get_irq(pdev, 0);
pr_info("LINK state irq: %d\n", priv->link_state_irq);
err = request_irq(priv->link_state_irq, rtldsa_switch_irq,
IRQF_SHARED, "rtldsa-link-state", priv->ds);
if (err) {
dev_err(dev, "Error setting up switch interrupt.\n");
/* Need to free allocated switch here */
}
/* Enable interrupts for switch, on RTL931x, the IRQ is always on globally */
if (soc_info.family != RTL9310_FAMILY_ID)
sw_w32(0x1, priv->r->imr_glb);
rtl83xx_get_l2aging(priv);
if (priv->r->qos_init)
priv->r->qos_init(priv);
if (priv->r->l3_setup)
priv->r->l3_setup(priv);
/* Clear all destination ports for mirror groups */
for (int i = 0; i < 4; i++)
priv->mirror_group_ports[i] = -1;
/* Initialize hash table for L3 routing */
rhltable_init(&priv->routes, &route_ht_params);
/* Register netevent notifier callback to catch notifications about neighboring
* changes to update nexthop entries for L3 routing.
*/
priv->ne_nb.notifier_call = rtl83xx_netevent_event;
if (register_netevent_notifier(&priv->ne_nb)) {
priv->ne_nb.notifier_call = NULL;
dev_err(dev, "Failed to register netevent notifier\n");
goto err_register_ne_nb;
}
priv->fib_nb.notifier_call = rtl83xx_fib_event;
/* Register Forwarding Information Base notifier to offload routes where
* possible
* Only FIBs pointing to our own netdevs are programmed into
* the device, so no need to pass a callback.
*/
err = register_fib_notifier(&init_net, &priv->fib_nb, NULL, NULL);
if (err)
goto err_register_fib_nb;
/* TODO: put this into l2_setup() */
switch (soc_info.family) {
default:
/* Flood BPDUs to all ports including cpu-port */
bpdu_mask = soc_info.family == RTL8380_FAMILY_ID ? 0x1FFFFFFF : 0x1FFFFFFFFFFFFF;
priv->r->set_port_reg_be(bpdu_mask, priv->r->rma_bpdu_fld_pmask);
/* TRAP 802.1X frames (EAPOL) to the CPU-Port, bypass STP and VLANs */
sw_w32(7, priv->r->spcl_trap_eapol_ctrl);
rtl838x_dbgfs_init(priv);
break;
case RTL9300_FAMILY_ID:
case RTL9310_FAMILY_ID:
rtl930x_dbgfs_init(priv);
break;
}
if (priv->r->lag_switch_init)
priv->r->lag_switch_init(priv);
return 0;
err_register_fib_nb:
unregister_netevent_notifier(&priv->ne_nb);
err_register_ne_nb:
dsa_switch_shutdown(priv->ds);
err_register_switch:
destroy_workqueue(priv->wq);
return err;
}
void rtldsa_93xx_lag_switch_init(struct rtl838x_switch_priv *priv)
{
u32 trk_ctrlmask = 0;
u32 algomask;
trk_ctrlmask |= RTL93XX_TRK_CTRL_NON_TMN_TUNNEL_HASH_SEL;
trk_ctrlmask |= RTL93XX_TRK_CTRL_TRK_STAND_ALONE_MODE;
trk_ctrlmask |= RTL93XX_TRK_CTRL_LOCAL_FIRST;
sw_w32(trk_ctrlmask, priv->r->trk_ctrl);
/* Setup NETDEV_LAG_HASH_L2 on slot 0 */
algomask = TRUNK_DISTRIBUTION_ALGO_SMAC_BIT |
TRUNK_DISTRIBUTION_ALGO_DMAC_BIT;
priv->r->lag_set_distribution_algorithm(priv, 0, RTL93XX_HASH_MASK_INDEX_L2, algomask);
/* Setup NETDEV_LAG_HASH_L23 on slot 1 */
algomask = TRUNK_DISTRIBUTION_ALGO_SMAC_BIT |
TRUNK_DISTRIBUTION_ALGO_DMAC_BIT |
TRUNK_DISTRIBUTION_ALGO_SIP_BIT |
TRUNK_DISTRIBUTION_ALGO_DIP_BIT;
priv->r->lag_set_distribution_algorithm(priv, 0, RTL93XX_HASH_MASK_INDEX_L23, algomask);
}
static void rtl83xx_sw_remove(struct platform_device *pdev)
{
struct rtl838x_switch_priv *priv = platform_get_drvdata(pdev);
if (!priv)
return;
/* TODO: */
pr_debug("Removing platform driver for rtl83xx-sw\n");
/* unregister notifiers which will create workqueue entries with
* references to the switch structures. Also stop self-arming delayed
* work items to avoid them still accessing the DSA structures
* when they are getting shut down.
*/
unregister_fib_notifier(&init_net, &priv->fib_nb);
unregister_netevent_notifier(&priv->ne_nb);
cancel_delayed_work_sync(&priv->counters_work);
dsa_switch_shutdown(priv->ds);
destroy_workqueue(priv->wq);
dev_set_drvdata(&pdev->dev, NULL);
}
static const struct of_device_id rtl83xx_switch_of_ids[] = {
{
.compatible = "realtek,rtl8380-switch",
.data = &rtldsa_838x_cfg,
},
{
.compatible = "realtek,rtl8392-switch",
.data = &rtldsa_839x_cfg,
},
{
.compatible = "realtek,rtl9301-switch",
.data = &rtldsa_930x_cfg,
},
{
.compatible = "realtek,rtl9311-switch",
.data = &rtldsa_931x_cfg,
},
{ /* sentinel */ }
};
MODULE_DEVICE_TABLE(of, rtl83xx_switch_of_ids);
static struct platform_driver rtl83xx_switch_driver = {
.probe = rtl83xx_sw_probe,
.remove = rtl83xx_sw_remove,
.driver = {
.name = "rtl83xx-switch",
.pm = NULL,
.of_match_table = rtl83xx_switch_of_ids,
},
};
module_platform_driver(rtl83xx_switch_driver);
MODULE_AUTHOR("B. Koblitz");
MODULE_DESCRIPTION("RTL83XX SoC Switch Driver");
MODULE_LICENSE("GPL");