taurus-node/tests/p2p_high_latency_test.py at develop · SynthWave-Systems/taurus-node

executable file
113 lines (101 loc) · 4.99 KB
#!/usr/bin/env python3
from testUtils import Utils, WaitSpec
from Cluster import Cluster
from WalletMgr import WalletMgr
from TestHelper import TestHelper
import signal
import platform
import subprocess
import time
###############################################################
# p2p connection in a high-latency network for a cluster of one producer and one syncing node.
#   This test simulates p2p connections in a high-latency network. The test case is such that there are one producer
#   and one syncing node, and a latency of 1100ms is introduced to their p2p connection.
#   The expected behavior is that the producer recognizes the net latency and does not send lib catchup to the syncing node.
#   As the syncing node is always behind, sending lib catchup is useless: the producer/peer node would get caught in an
#   infinite loop of sending lib catchup to the syncing node.
###############################################################
def readlogs(node_num, net_latency):
    """Follow a node's stderr log and check it for signs of unwanted lib catch-up.

    Spawns ``tail -F`` on ``var/lib/node_0<node_num>/stderr.txt`` and inspects
    each line read from it until roughly 80 seconds have elapsed. The deadline
    is only checked between reads, and ``readline`` blocks, so the call can
    overrun the deadline if the log goes quiet.

    Args:
        node_num: node index used to build the log file path.
        net_latency: latency (in ms) that was injected into the network.

    Returns:
        False as soon as a line shows the node catching up with the chain, or
        reports a network latency below 80% of ``net_latency``; True if the
        time window elapses without either.
    """
    # Local import: the file's import block does not bring `re` into scope.
    import re

    filename = 'var/lib/node_0{}/stderr.txt'.format(node_num)
    latRegex = re.compile(r'\d+ms')
    f = subprocess.Popen(['tail', '-F', filename],
                         stdout=subprocess.PIPE, stderr=subprocess.PIPE)
    try:
        t_end = time.time() + 80  # logs are processed for 80 seconds while the cluster runs
        while time.time() <= t_end:
            line = f.stdout.readline().decode("utf-8")
            print(line)
            if 'info' in line and 'Catching up with chain, our last req is ' in line:
                Utils.Print("Syncing node is catching up with chain, however it should not due to net latency")
                return False
            if 'debug' in line and 'Network latency' in line:
                # Only compare when the line actually carries an "<N>ms" token;
                # otherwise there is nothing to measure on this line.
                match = latRegex.search(line)
                if match is not None and float(match.group()[:-2]) < 0.8 * net_latency:
                    Utils.Print("Network latency is lower than expected.")
                    return False
        return True
    finally:
        # `tail -F` never exits on its own: stop it and release its pipes on
        # every exit path so the child process is not leaked.
        f.terminate()
        f.wait()
        f.stdout.close()
        f.stderr.close()
def exec(cmd):
    """Run *cmd* through the shell and report how it went.

    Both output streams are captured; stdout is discarded.

    Args:
        cmd: shell command line to execute.

    Returns:
        A ``(stderr_bytes, returncode)`` tuple for the finished command.
    """
    # NOTE: this name shadows the builtin ``exec``; it is kept because the
    # rest of the script calls it by this name.
    finished = subprocess.run(cmd, shell=True,
                              stdout=subprocess.PIPE, stderr=subprocess.PIPE)
    return finished.stderr, finished.returncode
Print=Utils.Print
args = TestHelper.parse_args({"--dump-error-details","--keep-logs","-v","--leave-running","--clean-run"})
Utils.Debug=args.v

# Cluster shape: one producer plus one syncing node.
producers=1
syncingNodes=1
totalNodes=producers+syncingNodes
cluster=Cluster(walletd=True)
dumpErrorDetails=args.dump_error_details
keepLogs=args.keep_logs
dontKill=args.leave_running
killAll=args.clean_run
testSuccessful=False
killEosInstances=not dontKill

# The producer listens on port 9876 and the syncing node is pointed at that
# same endpoint as its p2p peer.
specificExtraNodeosArgs={}
producerNodeId=0
syncingNodeId=1
specificExtraNodeosArgs[producerNodeId]=" --p2p-listen-endpoint 0.0.0.0:{}".format(9876+producerNodeId)
specificExtraNodeosArgs[syncingNodeId]="--p2p-peer-address 0.0.0.0:{}".format(9876+producerNodeId)

try:
    TestHelper.printSystemInfo("BEGIN")
    cluster.killall(allInstances=killAll)
    cluster.cleanup()
    traceNodeosArgs=" --plugin eosio::trace_api_plugin --trace-no-abis --plugin eosio::producer_plugin --produce-time-offset-us 0 --last-block-time-offset-us 0 --cpu-effort-percent 100 \
        --last-block-cpu-effort-percent 100 --producer-threads 1 --plugin eosio::net_plugin --net-threads 1"
    if cluster.launch(pnodes=1, totalNodes=totalNodes, totalProducers=1, useBiosBootFile=False, specificExtraNodeosArgs=specificExtraNodeosArgs, extraNodeosArgs=traceNodeosArgs) is False:
        Utils.cmdError("launcher")
        Utils.errorExit("Failed to stand up eos cluster.")
    cluster.waitOnClusterSync(blockAdvancing=5)
    Utils.Print("Cluster in Sync")
    cluster.biosNode.kill(signal.SIGTERM)
    Utils.Print("Bios node killed")
    latency = 1100 # 1100 millisecond
    # adding latency to all inbound and outbound traffic
    Utils.Print( "adding {}ms latency to network.".format(latency) )
    # macOS shapes traffic with dnctl/pfctl; every other platform uses tc/netem
    # on the loopback device.
    if platform.system() == 'Darwin':
        cmd = 'sudo dnctl pipe 1 config delay {} && \
            echo "dummynet out proto tcp from any to any pipe 1" | sudo pfctl -f - && \
            sudo pfctl -e'.format(latency)
    else:
        cmd = 'tc qdisc add dev lo root netem delay {}ms'.format(latency)
    err, ReturnCode = exec(cmd)
    if ReturnCode != 0:
        print(err.decode("utf-8")) # print error details of network slowdown initialization commands
        Utils.errorExit("failed to initialize network latency, exited with error code {}".format(ReturnCode))
    # Choose the teardown command before reading logs so it is ready to run
    # no matter how the log check ends.
    if platform.system() == 'Darwin':
        cmd = 'sudo pfctl -f /etc/pf.conf && \
            sudo dnctl -q flush && sudo pfctl -d'
    else:
        cmd = 'tc qdisc del dev lo root netem'
    try:
        # processing logs to make sure syncing node doesn't get into lib catch up mode.
        testSuccessful=readlogs(syncingNodeId, latency)
    finally:
        # Always undo the injected latency, even if the log check raised, so
        # the host network is not left slowed down after the test.
        err, ReturnCode = exec(cmd)
        if ReturnCode != 0:
            print(err.decode("utf-8")) # print error details of network slowdown termination commands
            Utils.errorExit("failed to remove network latency, exited with error code {}".format(ReturnCode))
finally:
    TestHelper.shutdown(cluster, None, testSuccessful, killEosInstances, False, keepLogs, killAll, dumpErrorDetails)

exitCode = 0 if testSuccessful else 1
exit(exitCode)
Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Uh oh!

FilesExpand file tree

p2p_high_latency_test.py

Latest commit

History

p2p_high_latency_test.py

File metadata and controls