Created
October 28, 2017 22:13
-
-
Save atomize/14a0f61f96e33a8c0f2207bfd6c2c163 to your computer and use it in GitHub Desktop.
CSV to JSON converter using BASH -- best one from updates in comments of https://gist.github.com/dsliberty/3de707bc656cf757a0cb
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#!/bin/bash
#
# CSV to JSON converter using BASH
# original script from https://gist.github.com/dsliberty/3de707bc656cf757a0cb
#
# Usage: ./csv2json.sh input.csv > output.json
#
# The JSON document is written to stdout; diagnostics are written to stderr
# so that they never end up inside a redirected output file.

#set -x

# Enable extended glob patterns such as +(...) for the rest of the script.
shopt -s extglob

# Path of the CSV file to convert (first positional argument).
input="${1:-}"

# Field separator used when splitting CSV records.
SEP=","

if [[ -z "${input}" ]]; then
    echo "No CSV input file specified" >&2
    exit 1
fi

if [[ ! -e "${input}" ]]; then
    echo "Unable to locate ${input}" >&2
    exit 1
fi
#######################################
# Extract the first field from a CSV record (or from the unparsed remainder
# of one).
#
# Globals:
#   SEP (read) - the single-character field separator.
# Arguments:
#   $1 - the record text to parse.
# Outputs:
#   For a non-empty record: the field value followed by a newline on stdout.
#   Enclosing double quotes are removed, a doubled quote ("") inside a quoted
#   field yields one literal quote, separators inside quotes are kept, and
#   carriage returns are dropped. Nothing is printed for an empty record.
# Returns:
#   0 for an empty record; otherwise the number of characters consumed from
#   the record, including the separator that ended the field, so the caller
#   can continue with "${record:$?}".
#   NOTE: a shell exit status only holds 0-255, so the value wraps around for
#   fields of 255 characters or more; callers must account for that.
#######################################
csv_nextField()
{
    # Strip carriage returns with a parameter expansion instead of
    # `echo | sed 's/\r//g'`: BSD sed reads \r as the letter "r", and echo
    # mis-handles records that look like one of its options (e.g. "-n").
    local line="${1//$'\r'/}"
    local char=""
    local field=""
    local offset=0
    local inQuotes=0

    if [[ -z "${line}" ]]; then
        return 0
    fi

    while [[ -n "${line}" ]]; do
        char="${line:0:1}"
        line="${line:1}"
        if [[ "${char}" == "${SEP}" && ${inQuotes} -eq 0 ]]; then
            # Unquoted separator: the field is complete. The separator is
            # accounted for by the "+ 1" in the return value below.
            break
        elif [[ "${char}" == '"' ]]; then
            if [[ ${inQuotes} -eq 1 && "${line:0:1}" == '"' ]]; then
                # "" inside a quoted field is an escaped literal quote;
                # consume the second quote character as well.
                field+='"'
                line="${line:1}"
                offset=$(( offset + 1 ))
            else
                # Opening or closing quote: toggle the state, emit nothing.
                inQuotes=$(( 1 - inQuotes ))
            fi
        else
            field+="${char}"
        fi
        offset=$(( offset + 1 ))
    done

    printf '%s\n' "${field}"
    return $(( offset + 1 ))
}
# ---------------------------------------------------------------------------
# Main conversion: print the CSV file named by ${input} as a JSON array on
# stdout, one object per data row, keyed by the names in the header row.
#
# Uses names defined earlier in the script: ${input}, and csv_nextField
# (which in turn reads ${SEP}).
# ---------------------------------------------------------------------------

# json_quote STRING
# Print STRING as a JSON string literal (no trailing newline). Backslash,
# double quote and tab are escaped; other characters are passed through
# unchanged.
json_quote()
{
    local text="${1}"
    text=${text//\\/\\\\}
    text=${text//\"/\\\"}
    text=${text//$'\t'/\\t}
    printf '"%s"' "${text}"
}

# json_value STRING
# Print the JSON representation of one CSV cell (no trailing newline):
#   empty                      -> null
#   null / true / false        -> emitted bare
#   unsigned integer           -> emitted bare (a leading zero such as 007 is
#                                 not a valid JSON number, so it is quoted)
#   anything else              -> escaped JSON string
json_value()
{
    local bare='^(null|true|false|0|[1-9][0-9]*)$'
    if [[ -z "${1}" ]]; then
        printf 'null'
    elif [[ "${1}" =~ ${bare} ]]; then
        printf '%s' "${1}"
    else
        json_quote "${1}"
    fi
}

# read_field RECORD
# Parse the first field of RECORD with csv_nextField and store the result in
# two globals: field_value (the text) and field_consumed (how many characters
# of RECORD the field occupied, including its separator).
#
# csv_nextField reports the consumed length through its exit status, which
# wraps modulo 256. The true length is always at least ${#field_value} + 1,
# so the smallest value >= that bound which is congruent to the status is
# used instead. (This assumes fewer than 256 quote characters were dropped
# from a single field.)
read_field()
{
    local status=0
    local minimum=0
    field_value="$(csv_nextField "${1}")"
    status=$?
    minimum=$(( ${#field_value} + 1 ))
    if (( status < minimum )); then
        status=$(( status + (minimum - status + 255) / 256 * 256 ))
    fi
    field_consumed=${status}
}

# --- Header row -------------------------------------------------------------
# IFS= and -r keep leading/trailing whitespace and backslashes intact.
first_line=""
IFS= read -r first_line < "${input}"
first_line="${first_line//$'\r'/}"

head_array=()   # raw column names
head_json=()    # the same names, pre-rendered as JSON string literals

# Split the header with the CSV parser itself (rather than counting
# separators) so a quoted column name containing the separator is one column.
if [[ -n "${first_line}" ]]; then
    while :; do
        read_field "${first_line}"
        head_array+=("${field_value}")
        head_json+=("$(json_quote "${field_value}")")
        # The last field runs to the end of the line without a separator,
        # so its reported length exceeds what is left.
        if (( field_consumed > ${#first_line} )); then
            break
        fi
        first_line="${first_line:${field_consumed}}"
    done
fi
headings=${#head_array[@]}

# --- Data rows --------------------------------------------------------------
echo "["
rows=0
{
    # Skip the header line; it was handled above.
    IFS= read -r each_line

    # "|| [[ -n ... ]]" also processes a final line that lacks a newline.
    while IFS= read -r each_line || [[ -n "${each_line}" ]]; do
        each_line="${each_line//$'\r'/}"

        # The separator is written before each object except the first, so
        # the total number of rows does not need to be known in advance.
        if (( rows > 0 )); then
            echo ","
        fi
        echo " {"
        for (( d = 0; d < headings; d++ )); do
            read_field "${each_line}"
            each_line="${each_line:${field_consumed}}"
            printf ' %s: ' "${head_json[d]}"
            json_value "${field_value}"
            if (( d + 1 < headings )); then
                echo ","
            else
                echo ""
            fi
        done
        printf ' }'
        rows=$(( rows + 1 ))
    done
} < "${input}"

# Terminate the line of the last object, if there was one.
if (( rows > 0 )); then
    echo ""
fi
echo "]"
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment