summer 2020 version of server_bench, take 1

2020-08-05 16:51:36 -04:00 · 2020-08-05 16:51:36 -04:00 · fac1440934
commit fac1440934
parent 3baf28ccae
1 changed files with 465 additions and 0 deletions
--- a/tests/server_bench.py
+++ b/tests/server_bench.py
@ -0,0 +1,465 @@
 #!/usr/bin/env python3
 #
 # Benchmark an HTTP server with wrk
 #
 # @author gback; Spring 2016, Spring 2018, Summer 2020
 #
 import getopt, sys, os, subprocess, signal, re, json, resource, time, socket, atexit
 from collections import namedtuple
 from http.client import HTTPConnection, OK
 # Field names of one benchmark configuration, in positional order.
 # The wrk flags mentioned below are the ones start_wrk() passes each field to.
 _runconfig_fields = (
    "name",  # name of configuration; also names the "<name>.tar" report (wrk -r)
    "nthreads",  # number of wrk threads (wrk -t)
    "nconnections",  # number of connections (wrk -c)
    "timeout",  # timeout with unit as string, i.e. "1s" (wrk -x)
    "window",  # window value (wrk -w)
    "overlap",  # overlap value (wrk -o)
    "description",  # human-readable description, shown by -l
    "path",  # target path to be retrieved
    "duration",  # duration with unit as string, i.e. "1s" (wrk -d)
 )
 runconfig = namedtuple("runconfig", _runconfig_fields)
 # Version tag stored under the "version" key of the results JSON.
 VERSION = "1.1"
 # Default path of the server executable; can be overridden with -s.
 server_exe = "./server"
 # Default server root directory; can be overridden with -R.
 server_root = "_serverroot_"
 # Location of the wrk load generator binary.
 wrk_exe = "/home/courses/cs3214/bin/wrk"
 # wrk thread count used by the test configurations that reference this name.
 nthreads = 64
 # Benchmark configurations. Unless -t selects a subset, the tests are run
 # in the order in which they are listed here.
 tests = [
    runconfig(
        name="login40",
        timeout="1s",
        nthreads=40,
        nconnections=40,
        duration="10s",
        path="/api/login",
        description="""
    Can your server handle 40 parallel connections request /api/login?
    """,
        window=500,
        overlap=250,
    ),
    runconfig(
        name="login500",
        timeout="5s",
        nthreads=nthreads,
        nconnections=500,
        duration="10s",
        path="/api/login",
        description="""
    Using 500 connections, each of which is repeatedly requesting /api/login (~2bytes in
    HTTP body).  We believe this should be enough to make the server CPU bound.
    """,
        window=1000,
        overlap=500,
    ),
    runconfig(
        name="login10k",
        timeout="5s",
        nthreads=nthreads,
        nconnections=10000,
        duration="30s",
        path="/api/login",
        description="""
    Handling 10k simultaneous connections has been a target of scalability since 1999:
    http://www.kegel.com/c10k.html
    Can your server handle it?
    """,
        window=1000,
        overlap=500,
    ),
    runconfig(
        name="wwwcsvt100",
        timeout="5s",
        nthreads=nthreads,
        nconnections=100,
        duration="20s",
        path="/www.cs.vt.edu-20200417.html",
        description="""
    The home page of the CS Department, as of 4/17/2020, is about 66KB large (not counting embedded objects).
    If 100 clients accessed it simultaneously, how much throughput could they expect?
    """,
        window=1000,
        overlap=500,
    ),
    # NOTE: despite the "100" in its name, this test is configured with
    # 40 threads and 40 connections.
    runconfig(
        name="doom100",
        timeout="10s",
        nthreads=40,
        nconnections=40,
        duration="20s",
        path="/large",
        description="""
    According to https://mobiforge.com/research-analysis/the-web-is-doom the combined size of all
    objects that make an average web page was 2,250kBytes as of April 2016. If these were transferred
    all in a single objects, how much throughput would you get?
    This should max out the 10Gbps Ethernet links, even with only 40 connections.
    """,
        window=500,
        overlap=250,
    ),
 ]
 # Lookup table from test name to its configuration.
 testsbyname = {c.name: c for c in tests}
 # Names of the tests to run, in order; -t replaces this with the user's list.
 # A real list (not a one-shot map() iterator) so it can be iterated more than
 # once and has the same type as the value produced by the -t option.
 teststorun = [t.name for t in tests]
 def listtests():
    """Print name, connection count, duration, path and description of every test."""
    entry_format = """
 Test:           %s
 Connections:    %d
 Duration:       %s
 Path:           %s
 Description:    %s
 """
    for cfg in tests:
        fields = (cfg.name, cfg.nconnections, cfg.duration, cfg.path, cfg.description)
        print(entry_format % fields)
 # Absolute directory containing this script; used to locate its helper files.
 # os.path.dirname() of the resolved path is already absolute and, unlike a
 # manual split/join on "/", stays "/" (not "") for a script in the root
 # directory, so it never falls back to the current working directory.
 script_dir = os.path.dirname(os.path.realpath(__file__))
 def usage():
    """Print the command-line help, filling in the script name and current defaults."""
    help_text = """
 Usage: %s [-hv] [-l] [-s server] [-R serverroot] [-t test1,test2,...] [url]
   -h                     display this help
   -v                     run verbose
   -s                     path to server executable, default %s
   -R server_root         path to server root, default %s
   -t test                run just the tests specified
   -l                     list available tests with their descriptions
   -i                     activate ink tracing tool
   url                    URL where your server can be reached, i.e.
                            http://hickory.rlogin:12306/
 This script must be started on two different rlogin nodes.
 On the first node, run it without a URL to start the server.
 Then run it on a second node with the URL printed out by the
 first run.
    """
    substitutions = (sys.argv[0], server_exe, server_root)
    print(help_text % substitutions)
 # Parse the command line. Invalid options print the error plus the usage
 # text and exit with status 2.
 try:
    opts, args = getopt.getopt(sys.argv[1:], "ihvs:R:t:l", ["help", "verbose"])
 except getopt.GetoptError as err:
    print(str(err))
    usage()
    sys.exit(2)
 verbose = False
 hostname = socket.gethostname()
 useInk = False
 for opt, arg in opts:
    # The long forms --help/--verbose are registered with getopt above, so
    # they must be handled here too instead of hitting the fallback below.
    if opt in ("-h", "--help"):
        usage()
        sys.exit(0)
    elif opt in ("-v", "--verbose"):
        verbose = True
    elif opt == "-i":
        useInk = True
    elif opt == "-s":
        server_exe = arg
    elif opt == "-R":
        server_root = arg
    elif opt == "-l":
        listtests()
        sys.exit(0)
    elif opt == "-t":
        teststorun = arg.split(",")
    else:
        # Only reachable if an option is added to the getopt spec without a
        # matching branch here.
        raise AssertionError("unhandled option")
 def raise_fd_limit():
    """Set the soft RLIMIT_NOFILE limit to the hard limit and print the result."""
    print("I will now try to raise the file descriptor limit")
    which = resource.RLIMIT_NOFILE
    ceiling = resource.getrlimit(which)[1]
    resource.setrlimit(which, (ceiling, ceiling))
    # Query again so the printed value is the limit actually in effect.
    in_effect = resource.getrlimit(which)[0]
    print("Your server process can open %d file descriptors simultaneously." % in_effect)
 def raise_thread_limit():
    """Set the soft RLIMIT_NPROC limit to the hard limit and print the result."""
    print("I will now try to raise the max number of threads you can spawn")
    which = resource.RLIMIT_NPROC
    ceiling = resource.getrlimit(which)[1]
    resource.setrlimit(which, (ceiling, ceiling))
    # Query again so the printed value is the limit actually in effect.
    in_effect = resource.getrlimit(which)[0]
    print("Your server process can spawn %d threads simultaneously." % in_effect)
 #
 # Start the server.
 #
 def start_server(root_dir):
    """Prepare the content, launch the server under test, verify it, then wait.

    Writes three files ("small", "large" and a copy of the CS home page) into
    root_dir, starts server_exe on a port derived from this process's pid,
    and checks that the three files and /api/login can be retrieved. On
    success it prints how to start the client and blocks until the server
    process exits.

    root_dir -- directory the server is told to serve (-R); created if missing.

    Exits the process with status -1 if the server executable is missing,
    if the server returns an unexpected status or content, or if the server
    cannot be reached within 10 attempts.
    """
    print("I will now prepare your server for benchmarking.")
    if not os.access(server_exe, os.X_OK):
        print("Did not find server executable: %s" % (server_exe))
        sys.exit(-1)
    # prepare files to be served
    print("I will use the directory %s to store 3 files" % (root_dir))
    # exist_ok avoids a FileExistsError when the directory is already there.
    os.makedirs(root_dir, exist_ok=True)

    def make_synthetic_content(sz):
        # sz characters of a repeating 16-character pattern (sz rounded down
        # to a multiple of 16).
        return "0123456789ABCDEF" * (sz // 16)

    def write_file(name, content):
        with open("%s/%s" % (root_dir, name), "wb") as sfile:
            sfile.write(content.encode("utf-8"))

    sfilecontent = make_synthetic_content(1024)
    write_file("small", sfilecontent)
    lfilecontent = make_synthetic_content(2250 * 1024)
    write_file("large", lfilecontent)
    # Read as UTF-8 because the copy is written, and later compared, as UTF-8.
    with open(
        "%s/res/www.cs.vt.edu-20200417.html" % script_dir, encoding="utf-8"
    ) as wwwfile:
        wwwcscont = wwwfile.read()
    write_file("www.cs.vt.edu-20200417.html", wwwcscont)

    # Derive the port from the pid so concurrent users are unlikely to collide.
    port = (os.getpid() % 10000) + 20000
    cmd = [server_exe, "-p", str(port), "-R", root_dir, "-s"]
    raise_fd_limit()
    raise_thread_limit()
    server = subprocess.Popen(cmd, stdout=subprocess.DEVNULL, stderr=sys.stderr)

    def clean_up_testing():
        # Best effort: the server may already have exited. Popen.kill() only
        # signals a child that has not been reaped, so a recycled pid is safe.
        try:
            server.kill()
        except OSError:
            pass

    atexit.register(clean_up_testing)
    print("I will now test that your server works.")

    def test_server():
        # Fetch every URL over one connection and compare with the expected body.
        http_conn = HTTPConnection(hostname, port)
        try:
            http_conn.connect()
            for url, expected in zip(
                ["/small", "/large", "/www.cs.vt.edu-20200417.html", "/api/login"],
                [sfilecontent, lfilecontent, wwwcscont, "{}"],
            ):
                http_conn.request("GET", url)
                server_response = http_conn.getresponse()
                sfile = server_response.read().decode("utf-8")
                if server_response.status != OK:
                    print(
                        "Server returned %s for %s, expected %d."
                        % (server_response.status, url, OK)
                    )
                    sys.exit(-1)
                if sfile == expected:
                    print("Retrieved %s ok." % (url))
                else:
                    print("Did not find expected content at %s." % (url))
                    sys.exit(-1)
        finally:
            http_conn.close()

    # Give the server up to 10 attempts, one second apart, to come up.
    # sys.exit() inside test_server() raises SystemExit, which is not caught
    # below, so wrong content aborts immediately instead of being retried.
    for tries in range(10):
        try:
            time.sleep(1)
            test_server()
            break
        except Exception as e:
            print(f'starting server failed: {e}')
    else:
        # Reached only when no attempt succeeded (the loop never hit break).
        print("Your server did not start, giving up after 10 tries")
        sys.exit(-1)

    this_script = os.path.realpath(sys.argv[0])
    print(
        f"""
 Congratulations, you are now ready to run the benchmark!
 Now, find another unloaded rlogin machine and run:
 {this_script} http://{hostname}:{port}/
 To use the ink tool, instead run 
 {this_script} -i http://{hostname}:{port}/
 When you are done, don't forget to hit ^C here.
 Your server's stdout is going to /dev/null.
 Your server's stderr is going to the driver's stderr.
 """
    )
    sys.stdout.flush()
    server.wait()
 def start_wrk(url, test):
    """Run wrk for one test configuration and return its parsed JSON results.

    url  -- base URL of the server; test.path is appended to it.
    test -- runconfig describing the run.

    wrk is started with the cs3214bench.lua script from script_dir and is
    told, via the JSON_OUTPUT_FILE and JSON_LUA environment variables, where
    to write its results and where JSON.lua lives. The results file is read,
    deleted, and its decoded content returned.
    """
    trace_flags = [] if useInk else ['--no-trace']
    flag_values = (
        ("-c", str(test.nconnections)),
        ("-t", str(test.nthreads)),
        ("-d", test.duration),
        ("-r", test.name + ".tar"),
        ("-x", test.timeout),
        ("-w", str(test.window)),
        ("-o", str(test.overlap)),
        ("-s", script_dir + "/cs3214bench.lua"),
    )
    cmd = [wrk_exe] + trace_flags
    for flag, value in flag_values:
        cmd.extend((flag, value))
    cmd.append(url + test.path)
    if verbose:
        print("I will now run", " ".join(cmd))

    resfile = "ssresults.json"
    luajson = "%s/JSON.lua" % script_dir
    assert os.access(luajson, os.R_OK)
    child_env = dict(os.environ, JSON_OUTPUT_FILE=resfile, JSON_LUA=luajson)
    wrk_proc = subprocess.Popen(
        cmd, stdout=sys.stdout, stderr=sys.stderr, env=child_env
    )
    wrk_proc.wait()

    with open(resfile) as jfile:
        parsed = json.load(jfile)
        # Remove the file only after it was parsed successfully.
        os.unlink(resfile)
    return parsed
 # Entry point: without a URL argument act as the server side; with a URL
 # run the selected benchmarks against it, save the results and score them.
 if len(args) == 0:
    start_server(server_root)
 else:
    # strip ending / since the path args contain them
    url = args[0].rstrip("/")
    if hostname in url:
        print("Please do not start the client on the same machine as the server.")
        sys.exit(-1)
    raise_fd_limit()
    raise_thread_limit()
    results = dict(version=VERSION)
    # Names of the tests that actually produced results; only these are scored.
    ran = []
    for testname in teststorun:
        if testname not in testsbyname:
            print("Test: %s not found, skipping" % testname)
            continue
        test = testsbyname[testname]
        print("Now running test: %s\n" % (testname))
        try:
            results[testname] = start_wrk(url, test)
        except Exception as e:
            print("An exception occurred %s, skipping this test" % (str(e)))
        else:
            # Record each test once, even if it was named repeatedly with -t.
            if testname not in ran:
                ran.append(testname)
    ofilename = "pserv.results.%d.json" % (os.getpid())
    print("Writing results to %s" % ofilename)
    with open(ofilename, "w") as ofile:
        json.dump(results, ofile)
    print(
        """
    Submit your results to the scoreboard with ~cs3214/bin/sspostresults.py %s
        """
        % ofilename
    )
    with open(ofilename, "r") as f:
        data = json.load(f)
    score = 0
    # the following rubric encodes the performance expectations for this semester
    # there are 20 pts currently, 4 pts per benchmark.
    #
    # "rps" / "mbps" hold (threshold, points) pairs, highest threshold first;
    # the first threshold that is strictly exceeded awards its points.
    #
    # If errors (p) is set, deduct |p| pts if there are one or more errors
    # (the values are written as negative numbers).
    #
    # If served (a, b) is set, deduct b pts unless a fraction of a clients was served
    #
    rubric = {
        "login40": {"rps": [(320, 4), (160, 2)], "errors": -1},
        "login500": {"rps": [(800, 4), (500, 2)], "errors": -1},
        "login10k": {"rps": [(650, 4), (450, 2)], "served": (0.80, 2)},
        # these max out the 10Gbps link, so these are MByte/s
        "wwwcsvt100": {"mbps": [(900, 4), (800, 2)]},
        "doom100": {"mbps": [(900, 4), (800, 2)]},
    }
    extra = ""
    for test in ran:
        points = rubric.get(test)
        if points is None:
            # No performance expectations defined for this test.
            continue
        summary = data[test]["summary"]
        category = 0
        if "rps" in points:
            # NOTE(review): presumably "duration" is reported in microseconds,
            # which would make this thousands of requests per second -- confirm
            # against cs3214bench.lua.
            rps = 1e3 * (summary["requests"] / summary["duration"])
            for requiredmin, value in points["rps"]:
                if rps > requiredmin:
                    category += value
                    break
            if test == "login10k" and rps > 900:
                extra = "+10 points extra credit for login10k! If your error count isn't > 5,000..."
        if "mbps" in points:
            mbps = 1e6 * summary["bytes"] / summary["duration"] / 1024 / 1024
            for requiredmin, value in points["mbps"]:
                if mbps > requiredmin:
                    category += value
                    break
        if "served" in points:
            (threshold, deduction) = points["served"]
            percent = summary["served"] / summary["connections"]
            if percent < threshold:
                category = max(category - deduction, 0)
        if "errors" in points:
            errors = sum(summary["errors"].values())
            if errors > 0:
                # Deduct the magnitude of the configured penalty; subtracting
                # the rubric entry itself (a dict) raised a TypeError.
                category = max(category - abs(points["errors"]), 0)
        print("%s: %d/4" % (test, category))
        score += category
    print("Your server got a performance score of %d/20" % score)
    if extra != "":
        print(extra)
    print(
        """
    Submit your individual <test_name>.tar reports with ~cs3214/bin/p4api.sh\nThis will return a link to visualize your server's performance.
        """
    )