Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

[tunnelmgrd]: Warm boot support #2166

Merged
merged 3 commits into from
Mar 17, 2022
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
46 changes: 44 additions & 2 deletions cfgmgr/tunnelmgr.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,7 @@
#include "tokenize.h"
#include "shellcmd.h"
#include "exec.h"
#include "warm_restart.h"

using namespace std;
using namespace swss;
Expand Down Expand Up @@ -107,7 +108,8 @@ static int cmdIpTunnelRouteDel(const std::string& pfx, std::string & res)
TunnelMgr::TunnelMgr(DBConnector *cfgDb, DBConnector *appDb, const std::vector<std::string> &tableNames) :
Orch(cfgDb, tableNames),
m_appIpInIpTunnelTable(appDb, APP_TUNNEL_DECAP_TABLE_NAME),
m_cfgPeerTable(cfgDb, CFG_PEER_SWITCH_TABLE_NAME)
m_cfgPeerTable(cfgDb, CFG_PEER_SWITCH_TABLE_NAME),
m_cfgTunnelTable(cfgDb, CFG_TUNNEL_TABLE_NAME)
{
std::vector<string> peer_keys;
m_cfgPeerTable.getKeys(peer_keys);
Expand All @@ -126,6 +128,23 @@ TunnelMgr::TunnelMgr(DBConnector *cfgDb, DBConnector *appDb, const std::vector<s
}
}
}

if (WarmStart::isWarmStart())
{
std::vector<string> tunnel_keys;
m_cfgTunnelTable.getKeys(tunnel_keys);

for (auto tunnel: tunnel_keys)
{
m_tunnelReplay.insert(tunnel);
}
if (m_tunnelReplay.empty())
{
finalizeWarmReboot();
}

}


auto consumerStateTable = new swss::ConsumerStateTable(appDb, APP_TUNNEL_ROUTE_TABLE_NAME,
TableConsumable::DEFAULT_POP_BATCH_SIZE, default_orch_pri);
Expand Down Expand Up @@ -191,6 +210,11 @@ void TunnelMgr::doTask(Consumer &consumer)
++it;
}
}

if (!replayDone && m_tunnelReplay.empty() && WarmStart::isWarmStart())
{
finalizeWarmReboot();
}
}

bool TunnelMgr::doTunnelTask(const KeyOpFieldsValuesTuple & t)
Expand Down Expand Up @@ -230,8 +254,16 @@ bool TunnelMgr::doTunnelTask(const KeyOpFieldsValuesTuple & t)
SWSS_LOG_NOTICE("Peer/Remote IP not configured");
}

m_appIpInIpTunnelTable.set(tunnelName, kfvFieldsValues(t));
/* If the tunnel is already in hardware (i.e. present in the replay),
* don't try to create it again since it will cause an OA crash
* (warmboot case)
*/
if (m_tunnelReplay.find(tunnelName) == m_tunnelReplay.end())
{
m_appIpInIpTunnelTable.set(tunnelName, kfvFieldsValues(t));
}
}
m_tunnelReplay.erase(tunnelName);
m_tunnelCache[tunnelName] = tunInfo;
}
else
Expand Down Expand Up @@ -356,3 +388,13 @@ bool TunnelMgr::configIpTunnel(const TunnelInfo& tunInfo)

return true;
}


void TunnelMgr::finalizeWarmReboot()
{
replayDone = true;
WarmStart::setWarmStartState("tunnelmgrd", WarmStart::REPLAYED);
SWSS_LOG_NOTICE("tunnelmgrd warmstart state set to REPLAYED");
WarmStart::setWarmStartState("tunnelmgrd", WarmStart::RECONCILED);
SWSS_LOG_NOTICE("tunnelmgrd warmstart state set to RECONCILED");
}
8 changes: 8 additions & 0 deletions cfgmgr/tunnelmgr.h
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,8 @@
#include "producerstatetable.h"
#include "orch.h"

#include <set>

namespace swss {

struct TunnelInfo
Expand All @@ -28,12 +30,18 @@ class TunnelMgr : public Orch

bool configIpTunnel(const TunnelInfo& info);

void finalizeWarmReboot();

ProducerStateTable m_appIpInIpTunnelTable;
Table m_cfgPeerTable;
Table m_cfgTunnelTable;

std::map<std::string, TunnelInfo > m_tunnelCache;
std::map<std::string, IpPrefix> m_intfCache;
std::string m_peerIp;

std::set<std::string> m_tunnelReplay;
bool replayDone = false;
};

}
4 changes: 4 additions & 0 deletions cfgmgr/tunnelmgrd.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -11,6 +11,7 @@
#include "exec.h"
#include "schema.h"
#include "tunnelmgr.h"
#include "warm_restart.h"

using namespace std;
using namespace swss;
Expand Down Expand Up @@ -54,6 +55,9 @@ int main(int argc, char **argv)
DBConnector cfgDb("CONFIG_DB", 0);
DBConnector appDb("APPL_DB", 0);

WarmStart::initialize("tunnelmgrd", "swss");
WarmStart::checkWarmStart("tunnelmgrd", "swss");

TunnelMgr tunnelmgr(&cfgDb, &appDb, cfgTunTables);

std::vector<Orch *> cfgOrchList = {&tunnelmgr};
Expand Down
29 changes: 29 additions & 0 deletions tests/test_warm_reboot.py
Original file line number Diff line number Diff line change
Expand Up @@ -2365,6 +2365,35 @@ def test_EverflowWarmReboot(self, dvs, dvs_acl):
dvs.start_swss()
dvs.check_swss_ready()

def test_TunnelMgrdWarmRestart(self, dvs):
tunnel_name = "MuxTunnel0"
tunnel_table = "TUNNEL_DECAP_TABLE"
tunnel_params = {
"tunnel_type": "IPINIP",
"dst_ip": "10.1.0.32",
"dscp_mode": "uniform",
"ecn_mode": "standard",
"ttl_mode": "pipe"
}

pubsub = dvs.SubscribeAppDbObject(tunnel_table)

dvs.runcmd("config warm_restart enable swss")
config_db = dvs.get_config_db()
config_db.create_entry("TUNNEL", tunnel_name, tunnel_params)

app_db = dvs.get_app_db()
app_db.wait_for_matching_keys(tunnel_table, [tunnel_name])

nadd, ndel = dvs.CountSubscribedObjects(pubsub)
assert nadd == len(tunnel_params)
assert ndel == 1 # Expect 1 deletion as part of table creation

dvs.runcmd("supervisorctl restart tunnelmgrd")
dvs.check_services_ready()
nadd, ndel = dvs.CountSubscribedObjects(pubsub)
assert nadd == 0
assert ndel == 0

# Add Dummy always-pass test at end as workaroud
# for issue when Flaky fail on final test it invokes module tear-down before retrying
Expand Down