pcolazurdo · March 16, 2020 19:16
diff --git a/transcribe.sh b/transcribe.sh
 # Download a YouTube video with youtube-dl, upload it to S3, run an Amazon
 # Transcribe job on it and print the resulting transcript text.
 #
 # Requires on PATH: youtube-dl, aws (configured credentials), jq.
 # Settings:
 #   YT_FILE      YouTube video id; also used as the S3 key and the job name.
 #   BUCKET_NAME  S3 bucket that receives the media file and the JSON result.
 set -euo pipefail

 YT_FILE=poX6BEzVmdE
 BUCKET_NAME="Please define the Bucket where the output will be sent - you can also use paths if needed"

 # The download pipeline looks for the "[download] Destination: <file>" line.
 # The prefix must be matched literally: an unescaped "[download]" is a regex
 # bracket expression (one character), so the previous grep never matched, and
 # "cut -d: -f1" kept the label in front of the colon instead of the filename.
 FILE_OUTPUT=$(
   youtube-dl -o '%(id)s.%(ext)s' --restrict-filenames \
     "https://www.youtube.com/watch?v=${YT_FILE}" \
     | sed -n 's/^\[download\] Destination: //p'
 )

 # Stop before touching AWS if no single, existing file name was captured.
 if [[ -z "${FILE_OUTPUT}" || ! -f "${FILE_OUTPUT}" ]]; then
   printf 'error: could not determine the downloaded file for %s\n' "${YT_FILE}" >&2
   exit 1
 fi

 aws s3 cp "${FILE_OUTPUT}" "s3://${BUCKET_NAME}/${YT_FILE}"
 aws transcribe start-transcription-job \
   --transcription-job-name "${YT_FILE}" \
   --language-code en-GB \
   --media "MediaFileUri=s3://${BUCKET_NAME}/${YT_FILE}" \
   --output-bucket-name "${BUCKET_NAME}"

 # Poll the job instead of sleeping a fixed 120 seconds: a fixed wait is
 # either wasted time or too short, in which case the download below fails.
 # Gives up after 120 polls, 10 seconds apart.
 job_status=
 for (( attempt = 0; attempt < 120; attempt++ )); do
   job_status=$(
     aws transcribe get-transcription-job \
       --transcription-job-name "${YT_FILE}" \
       --query 'TranscriptionJob.TranscriptionJobStatus' \
       --output text
   )
   case "${job_status}" in
     COMPLETED)
       break
       ;;
     FAILED)
       printf 'error: transcription job %s failed\n' "${YT_FILE}" >&2
       exit 1
       ;;
   esac
   sleep 10
 done

 if [[ "${job_status}" != "COMPLETED" ]]; then
   printf 'error: timed out waiting for transcription job %s\n' "${YT_FILE}" >&2
   exit 1
 fi

 # Fetch the result written to the output bucket and print only the text.
 aws s3 cp "s3://${BUCKET_NAME}/${YT_FILE}.json" .
 jq -r '.results.transcripts[].transcript' "${YT_FILE}.json"
	# Download a YouTube video with youtube-dl, upload it to S3, run an Amazon
	# Transcribe job on it and print the resulting transcript text.
	#
	# Requires on PATH: youtube-dl, aws (configured credentials), jq.
	# Settings:
	#   YT_FILE      YouTube video id; also used as the S3 key and the job name.
	#   BUCKET_NAME  S3 bucket that receives the media file and the JSON result.
	set -euo pipefail

	YT_FILE=poX6BEzVmdE
	BUCKET_NAME="Please define the Bucket where the output will be sent - you can also use paths if needed"

	# Real pipes are required here: "\|" is a literal "|" argument in shell, so
	# the filter commands were being passed to youtube-dl as extra arguments.
	# The "[download] Destination: <file>" prefix must also be matched literally:
	# an unescaped "[download]" is a regex bracket expression (one character),
	# and "cut -d: -f1" kept the label before the colon instead of the filename.
	FILE_OUTPUT=$(
	  youtube-dl -o '%(id)s.%(ext)s' --restrict-filenames \
	    "https://www.youtube.com/watch?v=${YT_FILE}" \
	    | sed -n 's/^\[download\] Destination: //p'
	)

	# Stop before touching AWS if no single, existing file name was captured.
	if [[ -z "${FILE_OUTPUT}" || ! -f "${FILE_OUTPUT}" ]]; then
	  printf 'error: could not determine the downloaded file for %s\n' "${YT_FILE}" >&2
	  exit 1
	fi

	aws s3 cp "${FILE_OUTPUT}" "s3://${BUCKET_NAME}/${YT_FILE}"
	aws transcribe start-transcription-job \
	  --transcription-job-name "${YT_FILE}" \
	  --language-code en-GB \
	  --media "MediaFileUri=s3://${BUCKET_NAME}/${YT_FILE}" \
	  --output-bucket-name "${BUCKET_NAME}"

	# Poll the job instead of sleeping a fixed 120 seconds: a fixed wait is
	# either wasted time or too short, in which case the download below fails.
	# Gives up after 120 polls, 10 seconds apart.
	job_status=
	for (( attempt = 0; attempt < 120; attempt++ )); do
	  job_status=$(
	    aws transcribe get-transcription-job \
	      --transcription-job-name "${YT_FILE}" \
	      --query 'TranscriptionJob.TranscriptionJobStatus' \
	      --output text
	  )
	  case "${job_status}" in
	    COMPLETED)
	      break
	      ;;
	    FAILED)
	      printf 'error: transcription job %s failed\n' "${YT_FILE}" >&2
	      exit 1
	      ;;
	  esac
	  sleep 10
	done

	if [[ "${job_status}" != "COMPLETED" ]]; then
	  printf 'error: timed out waiting for transcription job %s\n' "${YT_FILE}" >&2
	  exit 1
	fi

	# Fetch the result written to the output bucket and print only the text.
	aws s3 cp "s3://${BUCKET_NAME}/${YT_FILE}.json" .
	jq -r '.results.transcripts[].transcript' "${YT_FILE}.json"