@yuvalif
Last active May 31, 2022 17:03
Goal

The goal of this setup is to overload a single RGW, so that adding a second one increases the overall throughput without overloading the OSDs.

Setup

  • a machine with multiple NVMe drives and enough CPU/RAM to run both Ceph and the clients, e.g.
$ lsblk
NAME        MAJ:MIN RM   SIZE RO TYPE MOUNTPOINT
sda           8:0    0 893.8G  0 disk 
└─sda1        8:1    0 893.8G  0 part /
nvme1n1     259:0    0   1.5T  0 disk 
nvme4n1     259:1    0   1.5T  0 disk 
nvme7n1     259:2    0   1.5T  0 disk 
nvme3n1     259:3    0   1.5T  0 disk 
nvme5n1     259:4    0   1.5T  0 disk 
nvme6n1     259:5    0   1.5T  0 disk 
nvme2n1     259:6    0   1.5T  0 disk 
nvme0n1     259:7    0   1.5T  0 disk 
└─nvme0n1p1 259:8    0   1.5T  0 part
  • run vstart so that the RGWs do compression and the OSDs use the NVMe drives, e.g.
sudo MON=1 OSD=2 MDS=0 MGR=0 RGW=2 ../src/vstart.sh -n --bluestore-devs "/dev/nvme7n1,/dev/nvme6n1" --rgw_compression zlib --bluestore -o "bluestore_block_size=1500000000000" -o "rgw_dynamic_resharding=false"

Test

The payload uses multiple s3cmd clients to upload 1GB files (via multipart upload) in parallel. The attached upload.sh script can be used to upload 800 objects to a single RGW, or to spread them across 2 RGWs.
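The fan-out pattern used by upload.sh (start all clients in the background, then wait on their pids) can be sketched in Python as well; `run_parallel` and the `echo` commands below are hypothetical stand-ins for the actual s3cmd invocations:

```python
import subprocess

def run_parallel(cmds):
    """Start all shell commands concurrently, then wait; returns exit codes."""
    procs = [subprocess.Popen(cmd, shell=True) for cmd in cmds]
    return [p.wait() for p in procs]

# hypothetical stand-ins for the real `s3cmd put` commands
cmds = ["echo uploading object %d" % i for i in range(4)]
codes = run_parallel(cmds)
```

A nonzero entry in `codes` flags a failed upload, mirroring what `wait $pid` reports in the shell script.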

Metrics

The following metrics can be used to estimate when adding another RGW would increase the overall throughput of the system:

  • queue length: estimating how much pending work the RGW has
sudo ./bin/ceph --admin-daemon out/radosgw.8000.asok perf dump 2>/dev/null | jq .rgw.qlen
sudo ./bin/ceph --admin-daemon out/radosgw.8001.asok perf dump 2>/dev/null | jq .rgw.qlen
  • object put latency:
sudo ./bin/ceph --admin-daemon out/radosgw.8000.asok perf dump 2>/dev/null | jq .rgw.put_initial_lat.avgtime
sudo ./bin/ceph --admin-daemon out/radosgw.8001.asok perf dump 2>/dev/null | jq .rgw.put_initial_lat.avgtime
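Each latency counter in the perf dump is a cumulative sum/avgcount pair, so the average can also be derived directly from those two fields; the `perf` dict below is a hypothetical sample of the relevant slice of the JSON:

```python
# hypothetical excerpt of one RGW's `perf dump` output
perf = {"rgw": {"qlen": 12,
                "put_initial_lat": {"avgcount": 400, "sum": 92.0, "avgtime": 0.23}}}

lat = perf["rgw"]["put_initial_lat"]
# avgtime is simply sum/avgcount; guard against a zero count
avg = lat["sum"] / lat["avgcount"] if lat["avgcount"] else 0.0
print("qlen=%d avg put latency=%.2fs" % (perf["rgw"]["qlen"], avg))
```

Tracking the pair rather than `avgtime` is what makes the sliding-window workaround below possible.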

TODO

  1. Setting the threshold at 80% of queue capacity would be useful, provided that the maximum queue capacity is set correctly. In some cases increasing the queue capacity would increase the throughput, while in other cases adding another RGW would be more useful.
  2. The put latency is currently not calculated over a sliding window. See this issue. To work around that, metrics.py calculates latency over a 5-second sliding window.
  3. The put latency is mainly affected by the object size and the OSD latency. An "RGW only" latency metric should be added.
metrics.py

import subprocess
import sys
import time

# 5-sample (~5 second) sliding windows of cumulative (sum, count), one pair per RGW
rolling_lat_sum_arr1 = [0.0 for i in range(5)]
rolling_lat_count_arr1 = [0 for i in range(5)]
rolling_lat_sum_arr2 = [0.0 for i in range(5)]
rolling_lat_count_arr2 = [0 for i in range(5)]

def system(cmd):
    output = subprocess.check_output(cmd, shell=True).decode(sys.stdout.encoding).strip()
    return output

while True:
    # first RGW (admin socket of the RGW on port 8000)
    pid = system('pgrep radosgw | head -1')
    # grep instead of ag, to avoid the silver-searcher dependency
    cpu1 = system('top -p '+pid+' -b -n 1 | grep radosgw | awk \'{print $9}\'')
    qlen1 = system('./bin/ceph --admin-daemon out/radosgw.8000.asok perf dump 2>/dev/null | jq .rgw.qlen')
    lat_count = int(system('./bin/ceph --admin-daemon out/radosgw.8000.asok perf dump 2>/dev/null | jq .rgw.put_initial_lat.avgcount'))
    lat_sum = float(system('./bin/ceph --admin-daemon out/radosgw.8000.asok perf dump 2>/dev/null | jq .rgw.put_initial_lat.sum'))
    # shift the window and push the newest cumulative sample
    for i in range(4, 0, -1):
        rolling_lat_count_arr1[i] = rolling_lat_count_arr1[i-1]
        rolling_lat_sum_arr1[i] = rolling_lat_sum_arr1[i-1]
    rolling_lat_count_arr1[0] = lat_count
    rolling_lat_sum_arr1[0] = lat_sum
    # average latency over the window = delta(sum) / delta(count)
    sum_diff = rolling_lat_sum_arr1[0] - rolling_lat_sum_arr1[4]
    count_diff = rolling_lat_count_arr1[0] - rolling_lat_count_arr1[4]
    if count_diff <= 0:
        latency1 = 0.0
    else:
        latency1 = sum_diff/count_diff
    # second RGW (admin socket of the RGW on port 8001)
    pid = system('pgrep radosgw | tail -1')
    cpu2 = system('top -p '+pid+' -b -n 1 | grep radosgw | awk \'{print $9}\'')
    qlen2 = system('./bin/ceph --admin-daemon out/radosgw.8001.asok perf dump 2>/dev/null | jq .rgw.qlen')
    lat_count = int(system('./bin/ceph --admin-daemon out/radosgw.8001.asok perf dump 2>/dev/null | jq .rgw.put_initial_lat.avgcount'))
    lat_sum = float(system('./bin/ceph --admin-daemon out/radosgw.8001.asok perf dump 2>/dev/null | jq .rgw.put_initial_lat.sum'))
    for i in range(4, 0, -1):
        rolling_lat_count_arr2[i] = rolling_lat_count_arr2[i-1]
        rolling_lat_sum_arr2[i] = rolling_lat_sum_arr2[i-1]
    rolling_lat_count_arr2[0] = lat_count
    rolling_lat_sum_arr2[0] = lat_sum
    sum_diff = rolling_lat_sum_arr2[0] - rolling_lat_sum_arr2[4]
    count_diff = rolling_lat_count_arr2[0] - rolling_lat_count_arr2[4]
    if count_diff <= 0:
        latency2 = 0.0
    else:
        latency2 = sum_diff/count_diff
    print(qlen1, '%.2f'%latency1, cpu1, qlen2, '%.2f'%latency2, cpu2)
    time.sleep(1)
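The rolling-window bookkeeping in metrics.py could be factored into a small helper; this is a sketch, not part of the original gist:

```python
class SlidingWindow:
    """Average of a cumulative (sum, count) counter over the last N samples."""
    def __init__(self, size=5):
        self.sums = [0.0] * size
        self.counts = [0] * size

    def push(self, lat_sum, lat_count):
        # shift the window and insert the newest cumulative sample
        self.sums = [lat_sum] + self.sums[:-1]
        self.counts = [lat_count] + self.counts[:-1]
        sum_diff = self.sums[0] - self.sums[-1]
        count_diff = self.counts[0] - self.counts[-1]
        return sum_diff / count_diff if count_diff > 0 else 0.0

# feed it hypothetical cumulative (sum, count) samples, one per second
w = SlidingWindow()
for sample in [(1.0, 10), (3.0, 20), (6.0, 30)]:
    latency = w.push(*sample)
```

One instance per RGW would replace the four `rolling_lat_*` arrays and the duplicated shift loops.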
upload.sh

#!/bin/bash
if [ "$#" -ne 1 ]; then
    echo "Usage: $0 <#RGWs>"
    exit 1
fi
num_of_rgw=$1
echo "generating 1GB file"
head -c 1G </dev/urandom > myfile
host1=localhost:8000
if [ "$num_of_rgw" -eq 1 ]; then
    echo "uploading all objects to: $host1"
    host2=$host1
else
    # set host2 before echoing it
    host2=localhost:8001
    echo "uploading objects to: $host1 and: $host2"
fi
access=0555b35654ad1656d804
secret=h7GhxuBLTrlhVUyxSPUKUV8r/2EI4ngqJxD7iBdBYLhwluN30JaT3Q==
s3cmd --no-ssl --host=$host1 --host-bucket="$host1/%(bucket)" --access_key=$access --secret_key=$secret mb s3://mybucket
start_time=$(date +%s)
for i in {1..400}; do
    prefix=$(cat /dev/urandom | tr -cd 'a-f0-9' | head -c 5)
    sleep 0.1
    s3cmd --no-ssl --host=$host1 --host-bucket="$host1/%(bucket)" --access_key=$access --secret_key=$secret put myfile s3://mybucket/$prefix &
    pids[${i}]=$!
done
for i in {1..400}; do
    prefix=$(cat /dev/urandom | tr -cd 'a-f0-9' | head -c 5)
    sleep 0.1
    s3cmd --no-ssl --host=$host2 --host-bucket="$host2/%(bucket)" --access_key=$access --secret_key=$secret put myfile s3://mybucket/$prefix &
    pids[$((i+400))]=$!  # offset so the pids of the first batch are not overwritten
done
for pid in ${pids[*]}; do
    wait $pid
done
end_time=$(date +%s)
echo "================="
echo "Overall time is: " $((end_time-start_time)) "seconds"
echo "================="
yuvalif commented May 30, 2022

[chart: stats]

yuvalif commented May 30, 2022

The above chart is for 2 RGWs:
qlen = qlen1 + qlen2
cpu = cpu1 + cpu2 (percent out of 100)
latency1, latency2 = computed over a 5-second sliding window, separately for each RGW (multiplied by 10 to fit the scale of the other metrics)
800GB are uploaded in 980 seconds (~816MB/s)

yuvalif commented May 30, 2022

[chart: stats]

yuvalif commented May 30, 2022

The above chart is for 1 RGW:
latency = computed over a 5-second sliding window (multiplied by 10 to fit the scale of the other metrics)
800GB are uploaded in 1084 seconds (~738MB/s)
