Focusing

Kung-Hsiang Steeve Huang khuangaf

Focusing

Research Scientist @ Salesforce Research | Formerly: PhD @ UIUC, PhD Fellow @ Amazon, MSc @ USC, BEng @ HKUST | He/him/his 🇹🇼

khuangaf / gist:af7e9de7577959af84bda6bfe895a62c

Created August 26, 2018 12:48

	def second2timecode(time):
	    """Convert a duration in seconds into an SRT timecode ``HH:MM:SS,mmm``.

	    The value is rounded to the nearest millisecond before it is split into
	    fields, so ``1.001`` yields ``"00:00:01,001"`` and a value such as
	    ``59.9996`` carries over to ``"00:01:00,000"``.

	    Args:
	        time: Number of seconds (int or float). Expected to be non-negative;
	            negative values are not handled specially.

	    Returns:
	        The timecode string, e.g. ``3661.5`` -> ``"01:01:01,500"``.
	    """
	    # Work in whole milliseconds: a float difference such as
	    # (1.001 - 1) * 1000 evaluates to 0.99999..., which "%03d" would
	    # truncate to 000 and silently lose a millisecond.
	    total_msecs = int(round(float(time) * 1000))
	    total_secs, msecs = divmod(total_msecs, 1000)
	    total_minutes, secs = divmod(total_secs, 60)
	    hours, minutes = divmod(total_minutes, 60)
	    return "%02d:%02d:%02d,%03d" % (hours, minutes, secs, msecs)

khuangaf / gist:4c40784cc506ae8d43188089be25177c

Created August 26, 2018 12:24

	def same_subtitle(current_subtitle, next_subtitle):
	'''Return True if the two given subtitles are the same, tolerating small differences.

	NOTE(review): only the set-building steps are visible in this excerpt; the
	comparison that produces the return value is not shown here.
	'''
	# Convert each subtitle into a set of its elements (the characters, for a
	# string), e.g. '我很乖' -> {'我','很','乖'}. Duplicates and ordering are dropped.
	current_set = set(current_subtitle)
	next_set = set(next_subtitle)
	# Number of distinct elements in each subtitle.
	current_set_len = len(current_set)
	next_set_len = len(next_set)
	# Elements that occur in both subtitles, and how many there are.
	intersect_set = current_set & next_set
	intersect_set_len = len(intersect_set)

khuangaf / gist:f1b65d67525e4eb32ac4373cb6aed621

Created August 26, 2018 03:48

	# Assemble the results table: create the frame with its three column
	# labels, then fill the columns in the same order they are declared.
	df = pd.DataFrame(columns=['id', 'prediction', 'confidence'])
	df['id'], df['prediction'], df['confidence'] = (
	    image_ids,
	    predictions,
	    confidences,
	)
	# Write one CSV named after the video id inside the results directory.
	# index=None is falsy, so presumably the row index is left out -- confirm.
	df.to_csv(f'{args.results_dir}/{video_id}.csv', index=None)

khuangaf / gist:37394b1ff250c4a10b10844e2528d98e

Last active August 26, 2018 03:42

	# The endpoint of the API (v1p1beta1 images:annotate).
	# NOTE(review): not referenced again in the visible lines.
	ENDPOINT_URL = 'https://vision.googleapis.com/v1p1beta1/images:annotate'
	# Path to the credentials JSON file, exposed through the
	# GOOGLE_APPLICATION_CREDENTIALS environment variable (this is a file path,
	# not an API key; the value below is a placeholder to replace).
	os.environ['GOOGLE_APPLICATION_CREDENTIALS']='your/path/to/credentials.json'
	# Initialise the API client
	client = vision.ImageAnnotatorClient()

	# Read the raw bytes of the image file and wrap them in a Vision Image object
	with io.open(YOUR_IMAGE_PATH, 'rb') as f:
	content = f.read()
	image = vision.types.Image(content=content)

khuangaf / gist:8fdecdae70a1534252b45f396f5c91b3

Created August 24, 2018 14:48

	class SubtitleConfig(Config):
	"""Configuration for training on the subtitle dataset.

	NOTE(review): the summary previously said "nucleus segmentation dataset",
	which does not match NAME or the class list below; confirm the wording.
	"""
	# Give the configuration a recognizable name
	NAME = "subtitle"

	# Images processed per GPU; adjust depending on your GPU memory
	IMAGES_PER_GPU = 4

	# Number of classes (including background)
	NUM_CLASSES = 1 + 1 # Background + subtitle

khuangaf / gist:a67c65c6b7b48f96fe5a01114fce2aab

Last active August 24, 2018 14:40

	def get_multi_masks(img):
	'''
	Get connected components (multi-masks).

	Args:
	img: np.ndarray
	Returns:
	np.ndarray with the same dimensions as the input
	'''

	# Threshold the image so that its values become either 0 or 1

khuangaf / gist:7eba0599543c2a1ba34ad8cc9159fd45

Created August 22, 2018 14:25

	def video2frames(video_id, video_path, processed_videos_dir, frame_path, sample_rate):
	"""
	Execute shell command which calls ffmpeg to split video into frames.
	Parameters
	----------
	video_id : str
	The video id of a video
	video_path: str
	The directory storing the videos
	processed_video_path: str

khuangaf / gist:3aaa7100764a5ce23c509c77a6d97490

Created August 22, 2018 12:58

	def extract_audio(video_id,videos_dir, audios_dir):
	"""
	Download the videos
	Parameters
	----------
	video_id : str
	A Youtube video id.
	videos_dir: str
	The directory which stores videos.
	audios_dir: str

khuangaf / gist:0e6d3c9d55f7eb70e4de47951749eebe

Last active August 22, 2018 12:55

	def download_video(video_id, path="videos", verbose=True):

	"""
	Download the videos
	Parameters
	----------
	video_id : str
	A Youtube video id.
	path: str
	The directory which stores videos.

khuangaf / gist:66a8cafc6b7675183944e793e0ebeca6

Created August 22, 2018 12:49

	def get_video_ids(playlist_id):
	"""
	Get the video ids given a playlist id.
	Parameters
	----------
	playlist_id : str
	A Youtube playlist id. (up to 50 results)
	Returns
	-------
	video_ids: list(str)