stephanie-wang · April 7, 2020 21:04
diff --git a/video_benchmark.py b/video_benchmark.py
 import subprocess
 import cv2
 import os.path
 import numpy as np
 import time
 import json
 import threading
 import tempfile

 import ray
 import ray.cluster_utils

 # Directory that get_chunk_file() builds per-frame PNG paths into.
 OUTPUT_DIR = "/home/swang/data/images"
 # Video file that main() opens and hands to process_video().
 TEST_VIDEO = "/home/swang/data/test.mp4"

 # Maximum number of frames given to a single process_chunk task; also the
 # chunk stride used by get_chunk_file().
 NUM_FRAMES_PER_CHUNK = 10
 # Upper bound on the number of frames main() processes.
 MAX_FRAMES = 1200.0

 # Gates the cleanup_chunk() pass at the end of process_video().
 CLEANUP = False

 # A compute_mse result below this value makes process_chunk reuse the result
 # of the previously processed frame instead of calling process_frame again.
 MSE_THRESHOLD = 70

 def get_chunk_file(chunk_index, frame):
     """Return the path of the PNG image for one frame of a chunk.

     `frame` is the frame's offset inside chunk `chunk_index`; it is turned
     into a global frame number (chunks are NUM_FRAMES_PER_CHUNK frames apart)
     and formatted into a zero-padded file name under OUTPUT_DIR.
     """
     global_frame = chunk_index * NUM_FRAMES_PER_CHUNK + frame
     return os.path.join(OUTPUT_DIR, "image-{:06d}.png".format(global_frame))

 @ray.remote(resources={"query": 1})
 def process_frame(frame):
     """Placeholder query task: wait 0.2 seconds and return a fixed string.

     The `frame` argument is accepted but never inspected.
     """
     simulated_latency_s = 0.2
     time.sleep(simulated_latency_s)
     placeholder_result = "a result"
     return placeholder_result

 @ray.remote(resources={"preprocess": 1})
 def load_frames(filename):
     """Read the image stored at `filename` and return it resized to 416x416.

     Fails with an AssertionError when cv2.imread returns None.

     NOTE: this file defines `load_frames` a second time further down (taking
     a start frame and a frame count); the name ends up bound to that later
     definition.
     """
     loaded = cv2.imread(filename)
     assert loaded is not None
     return cv2.resize(loaded, (416, 416))

 @ray.remote(resources={"preprocess": 1})
 def load_frames(filename, start_frame, num_frames):
     """Decode `num_frames` consecutive frames of a video file.

     Args:
         filename: Path of the video, passed to cv2.VideoCapture.
         start_frame: Index of the first frame to decode; the capture is
             positioned there through CAP_PROP_POS_FRAMES.
         num_frames: Number of frames to read.

     Returns:
         A list holding the decoded frames in reading order.

     Raises:
         AssertionError: If a frame could not be read.
     """
     v = cv2.VideoCapture(filename)
     try:
         v.set(cv2.CAP_PROP_POS_FRAMES, start_frame)
         frames = []
         for _ in range(num_frames):
             grabbed, frame = v.read()
             assert grabbed, "could not read a frame from {}".format(filename)
             frames.append(frame)
         return frames
     finally:
         # Release the capture explicitly, also when a read fails, instead of
         # leaving the underlying handle open until garbage collection.
         v.release()

 @ray.remote(resources={"preprocess": 1})
 def compute_mse(frame1, frame2):
     """Return the mean squared error between two equally shaped frames.

     The difference is computed in float64. Frames decoded by OpenCV are
     presumably uint8 arrays (TODO confirm against the caller); with an
     unsigned integer dtype both the subtraction and the squaring would wrap
     around instead of producing the true squared difference.

     Args:
         frame1: First frame (array-like).
         frame2: Second frame (array-like), same shape as `frame1`.

     Returns:
         The mean of the element-wise squared differences, as a float64 scalar.
     """
     # dtype=np.float64 makes the ufunc cast the inputs before subtracting, so
     # negative differences are kept rather than wrapped.
     difference = np.subtract(frame1, frame2, dtype=np.float64)
     return np.square(difference).mean()

 @ray.remote(resources={"preprocess": 1})
 def process_chunk(filename, start_frame, num_frames):
     """Process one chunk of a video and return one result per frame.

     The chunk's frames are produced by a `load_frames` task. The first frame
     is always submitted to `process_frame`. Every later frame is compared,
     through `compute_mse`, with the most recent frame that was submitted; it
     reuses that frame's result while the error stays below MSE_THRESHOLD and
     is submitted itself otherwise.
     """
     frame_futures = load_frames.options(num_return_vals=num_frames).remote(
         filename, start_frame, num_frames)

     pending = []
     key_index = None  # index of the last frame submitted to process_frame
     for index, current in enumerate(frame_futures):
         if key_index is None:
             difference = MSE_THRESHOLD
         else:
             difference = ray.get(
                 compute_mse.remote(current, frame_futures[key_index]))

         if difference < MSE_THRESHOLD:
             # Close enough to the key frame: share its pending result.
             pending.append(pending[key_index])
             continue

         pending.append(process_frame.remote(current))
         key_index = index
         if index != 0:
             print("switch frame", index)
     return ray.get(pending)


 def cleanup_chunk(chunk_index, num_frames):
     """Delete the image files of one chunk.

     Removes the files returned by get_chunk_file for frame offsets
     `num_frames` down to 1, in that order.
     """
     for offset in reversed(range(1, num_frames + 1)):
         os.remove(get_chunk_file(chunk_index, offset))


 def process_video(video_pathname, num_total_frames):
     """Split a video into chunks, process them remotely and collect the results.

     Chunks of up to NUM_FRAMES_PER_CHUNK frames are submitted as
     `process_chunk` tasks. Once four tasks are outstanding, the oldest one is
     waited for before the next chunk is submitted.

     Args:
         video_pathname: Path of the video, forwarded to every process_chunk
             task.
         num_total_frames: Number of frames to process, counted from frame 0.
             A float value is truncated to an int.

     Returns:
         The results of all chunks, concatenated in submission order.
     """
     # Callers may pass a float frame count; keep all chunk arithmetic integral
     # so that the per-chunk frame counts stay usable as counts downstream.
     num_total_frames = int(num_total_frames)

     results = []
     futures = []
     # Frame count of every submitted chunk; the list position is the chunk
     # index used by the cleanup pass below.
     chunk_sizes = []
     start_frame = 0
     while start_frame < num_total_frames:
         if len(futures) >= 4:
             results += ray.get(futures.pop(0))
         print("Processing chunk at index", start_frame)
         num_frames = min(NUM_FRAMES_PER_CHUNK, num_total_frames - start_frame)
         futures.append(process_chunk.remote(video_pathname, start_frame, num_frames))
         chunk_sizes.append(num_frames)
         start_frame += num_frames

     for f in futures:
         results += ray.get(f)

     if CLEANUP:
         # The last chunk can be shorter than NUM_FRAMES_PER_CHUNK, so clean up
         # each chunk with the number of frames it actually had.
         for i, size in enumerate(chunk_sizes):
             cleanup_chunk(i, size)

     return results


 def main(test_failure):
     """Run the video benchmark on a local multi-node Ray cluster.

     Adds a first node with no CPUs, two nodes offering the "preprocess"
     resource and one node offering the "query" resource. It then processes
     up to MAX_FRAMES frames of TEST_VIDEO on a background thread and prints
     the elapsed time and the throughput. Finally the Ray timeline is dumped
     to "dump.json".

     Args:
         test_failure: When true, the last preprocess node is removed
             non-gracefully five seconds into the run, and a replacement
             preprocess node is added one second later.
     """
     internal_config = json.dumps({
         "initial_reconstruction_timeout_milliseconds": 100000,
         "num_heartbeats_timeout": 10,
         "lineage_pinning_enabled": 1,
         "free_objects_period_milliseconds": -1,
         "object_manager_repeated_push_delay_ms": 1000,
     })
     cluster = ray.cluster_utils.Cluster()
     cluster.add_node(num_cpus=0, _internal_config=internal_config)
     preprocess_nodes = [
         cluster.add_node(
             object_store_memory=10**9,
             num_cpus=2,
             resources={"preprocess": 100},
             _internal_config=internal_config)
         for _ in range(2)
     ]
     # Single query node; its handle is not needed afterwards.
     cluster.add_node(
         object_store_memory=10**9,
         num_cpus=2,
         resources={"query": 100},
         _internal_config=internal_config)
     cluster.wait_for_nodes()

     ray.init(address=cluster.address)
     start = time.time()

     v = cv2.VideoCapture(TEST_VIDEO)
     try:
         # The property value and MAX_FRAMES are floats; the frame count is
         # used for chunk sizes later on, so convert it to an int here.
         num_total_frames = int(min(v.get(cv2.CAP_PROP_FRAME_COUNT), MAX_FRAMES))
     finally:
         # The capture is only needed for the frame count.
         v.release()
     print("FRAMES", num_total_frames)
     t = threading.Thread(target=process_video, args=(TEST_VIDEO, num_total_frames))
     t.start()

     if test_failure:
         time.sleep(5)
         cluster.remove_node(preprocess_nodes[-1], allow_graceful=False)
         time.sleep(1)
         cluster.add_node(num_cpus=2, resources={"preprocess": 100}, _internal_config=internal_config)

     t.join()

     end = time.time()
     print("Finished in", end - start)
     print("Throughput:", num_total_frames / (end - start))

     ray.timeline(filename="dump.json")

 if __name__ == "__main__":
     # Script entry point: `--failure` switches on the node-failure scenario
     # of main().
     import argparse

     parser = argparse.ArgumentParser(description='Run the video benchmark.')
     parser.add_argument("--failure", action="store_true")
     main(parser.parse_args().failure)
	import subprocess
	import cv2
	import os.path
	import numpy as np
	import time
	import json
	import threading
	import tempfile

	import ray
	import ray.cluster_utils

	# Directory that get_chunk_file() builds per-frame PNG paths into.
	OUTPUT_DIR = "/home/swang/data/images"
	# Video file that main() opens and hands to process_video().
	TEST_VIDEO = "/home/swang/data/test.mp4"

	# Maximum number of frames given to a single process_chunk task; also the
	# chunk stride used by get_chunk_file().
	NUM_FRAMES_PER_CHUNK = 10
	# Upper bound on the number of frames main() processes.
	MAX_FRAMES = 1200.0

	# Gates the cleanup_chunk() pass at the end of process_video().
	CLEANUP = False

	# A compute_mse result below this value makes process_chunk reuse the result
	# of the previously processed frame instead of calling process_frame again.
	MSE_THRESHOLD = 70

	def get_chunk_file(chunk_index, frame):
		"""Return the path of the PNG image for one frame of a chunk.

		`frame` is the frame's offset inside chunk `chunk_index`; it is turned
		into a global frame number (chunks are NUM_FRAMES_PER_CHUNK frames apart)
		and formatted into a zero-padded file name under OUTPUT_DIR.
		"""
		global_frame = chunk_index * NUM_FRAMES_PER_CHUNK + frame
		return os.path.join(OUTPUT_DIR, "image-{:06d}.png".format(global_frame))

	@ray.remote(resources={"query": 1})
	def process_frame(frame):
		"""Placeholder query task: wait 0.2 seconds and return a fixed string.

		The `frame` argument is accepted but never inspected.
		"""
		time.sleep(0.2)
		return "a result"

	@ray.remote(resources={"preprocess": 1})
	def load_frames(filename):
		"""Read the image stored at `filename` and return it resized to 416x416.

		Fails with an AssertionError when cv2.imread returns None.

		NOTE: this file defines `load_frames` again right after this block
		(taking a start frame and a frame count); the name ends up bound to
		that later definition.
		"""
		image = cv2.imread(filename)
		assert image is not None
		return cv2.resize(image, (416, 416))

	@ray.remote(resources={"preprocess": 1})
	def load_frames(filename, start_frame, num_frames):
		"""Decode `num_frames` consecutive frames of a video file.

		Args:
			filename: Path of the video, passed to cv2.VideoCapture.
			start_frame: Index of the first frame to decode; the capture is
				positioned there through CAP_PROP_POS_FRAMES.
			num_frames: Number of frames to read.

		Returns:
			A list holding the decoded frames in reading order.

		Raises:
			AssertionError: If a frame could not be read.
		"""
		v = cv2.VideoCapture(filename)
		try:
			v.set(cv2.CAP_PROP_POS_FRAMES, start_frame)
			frames = []
			for _ in range(num_frames):
				grabbed, frame = v.read()
				assert grabbed, "could not read a frame from {}".format(filename)
				frames.append(frame)
			return frames
		finally:
			# Release the capture explicitly, also when a read fails, instead
			# of leaving the underlying handle open until garbage collection.
			v.release()

	@ray.remote(resources={"preprocess": 1})
	def compute_mse(frame1, frame2):
		"""Return the mean squared error between two equally shaped frames.

		The difference is computed in float64. Frames decoded by OpenCV are
		presumably uint8 arrays (TODO confirm against the caller); with an
		unsigned integer dtype both the subtraction and the squaring would wrap
		around instead of producing the true squared difference.

		Args:
			frame1: First frame (array-like).
			frame2: Second frame (array-like), same shape as `frame1`.

		Returns:
			The mean of the element-wise squared differences, as a float64
			scalar.
		"""
		# dtype=np.float64 makes the ufunc cast the inputs before subtracting,
		# so negative differences are kept rather than wrapped.
		difference = np.subtract(frame1, frame2, dtype=np.float64)
		return np.square(difference).mean()

	@ray.remote(resources={"preprocess": 1})
	def process_chunk(filename, start_frame, num_frames):
		"""Process one chunk of a video and return one result per frame.

		The chunk's frames are produced by a `load_frames` task. The first frame
		is always submitted to `process_frame`. Every later frame is compared,
		through `compute_mse`, with the most recent frame that was submitted; it
		reuses that frame's result while the error stays below MSE_THRESHOLD and
		is submitted itself otherwise.
		"""
		frames = load_frames.options(num_return_vals=num_frames).remote(filename, start_frame, num_frames)

		# Index of the last frame that was submitted to process_frame.
		last_frame_index = None
		results = []
		for i, frame in enumerate(frames):
			mse = MSE_THRESHOLD
			if last_frame_index is not None:
				mse = ray.get(compute_mse.remote(frame, frames[last_frame_index]))
			if mse < MSE_THRESHOLD:
				# Close enough to the last submitted frame: share its result.
				results.append(results[last_frame_index])
			else:
				results.append(process_frame.remote(frame))
				last_frame_index = i
				if i != 0:
					print("switch frame", i)
		return ray.get(results)


	def cleanup_chunk(chunk_index, num_frames):
		"""Delete the image files of one chunk.

		Removes the files returned by get_chunk_file for frame offsets
		`num_frames` down to 1, in that order.
		"""
		for frame in range(num_frames, 0, -1):
			filename = get_chunk_file(chunk_index, frame)
			os.remove(filename)


	def process_video(video_pathname, num_total_frames):
		"""Split a video into chunks, process them remotely and collect the results.

		Chunks of up to NUM_FRAMES_PER_CHUNK frames are submitted as
		`process_chunk` tasks. Once four tasks are outstanding, the oldest one
		is waited for before the next chunk is submitted.

		Args:
			video_pathname: Path of the video, forwarded to every
				process_chunk task.
			num_total_frames: Number of frames to process, counted from
				frame 0. A float value is truncated to an int.

		Returns:
			The results of all chunks, concatenated in submission order.
		"""
		# Callers may pass a float frame count; keep all chunk arithmetic
		# integral so the per-chunk frame counts stay usable as counts.
		num_total_frames = int(num_total_frames)

		results = []
		futures = []
		# Frame count of every submitted chunk; the list position is the chunk
		# index used by the cleanup pass below.
		chunk_sizes = []
		start_frame = 0
		while start_frame < num_total_frames:
			if len(futures) >= 4:
				results += ray.get(futures.pop(0))
			print("Processing chunk at index", start_frame)
			num_frames = min(NUM_FRAMES_PER_CHUNK, num_total_frames - start_frame)
			futures.append(process_chunk.remote(video_pathname, start_frame, num_frames))
			chunk_sizes.append(num_frames)
			start_frame += num_frames

		for f in futures:
			results += ray.get(f)

		if CLEANUP:
			# The last chunk can be shorter than NUM_FRAMES_PER_CHUNK, so clean
			# up each chunk with the number of frames it actually had.
			for i, size in enumerate(chunk_sizes):
				cleanup_chunk(i, size)

		return results


	def main(test_failure):
		"""Run the video benchmark on a local multi-node Ray cluster.

		Adds a first node with no CPUs, two nodes offering the "preprocess"
		resource and one node offering the "query" resource. It then processes
		up to MAX_FRAMES frames of TEST_VIDEO on a background thread and prints
		the elapsed time and the throughput. Finally the Ray timeline is dumped
		to "dump.json".

		Args:
			test_failure: When true, the last preprocess node is removed
				non-gracefully five seconds into the run, and a replacement
				preprocess node is added one second later.
		"""
		internal_config = json.dumps({
			"initial_reconstruction_timeout_milliseconds": 100000,
			"num_heartbeats_timeout": 10,
			"lineage_pinning_enabled": 1,
			"free_objects_period_milliseconds": -1,
			"object_manager_repeated_push_delay_ms": 1000,
		})
		cluster = ray.cluster_utils.Cluster()
		cluster.add_node(num_cpus=0, _internal_config=internal_config)
		preprocess_nodes = [cluster.add_node(object_store_memory=10**9, num_cpus=2, resources={"preprocess": 100}, _internal_config=internal_config) for _ in range(2)]
		# Single query node; its handle is not needed afterwards.
		cluster.add_node(object_store_memory=10**9, num_cpus=2, resources={"query": 100}, _internal_config=internal_config)
		cluster.wait_for_nodes()

		ray.init(address=cluster.address)
		start = time.time()

		v = cv2.VideoCapture(TEST_VIDEO)
		try:
			# The property value and MAX_FRAMES are floats; the frame count is
			# used for chunk sizes later on, so convert it to an int here.
			num_total_frames = int(min(v.get(cv2.CAP_PROP_FRAME_COUNT), MAX_FRAMES))
		finally:
			# The capture is only needed for the frame count.
			v.release()
		print("FRAMES", num_total_frames)
		t = threading.Thread(target=process_video, args=(TEST_VIDEO, num_total_frames))
		t.start()

		if test_failure:
			time.sleep(5)
			cluster.remove_node(preprocess_nodes[-1], allow_graceful=False)
			time.sleep(1)
			cluster.add_node(num_cpus=2, resources={"preprocess": 100}, _internal_config=internal_config)

		t.join()

		end = time.time()
		print("Finished in", end - start)
		print("Throughput:", num_total_frames / (end - start))

		ray.timeline(filename="dump.json")

	if __name__ == "__main__":
		# Script entry point: `--failure` switches on the node-failure scenario
		# of main().
		import argparse
		parser = argparse.ArgumentParser(description='Run the video benchmark.')

		parser.add_argument("--failure", action="store_true")
		args = parser.parse_args()
		main(args.failure)
No results found