This was an experiment in seeing how feasible it would be to distribute crates on IPFS using the alternative registries feature combined with a local IPFS web gateway.
There was very little plan for this originally, and I wish I had kept more of the intermediate states as I went through multiple major design changes. My original goal was to publish my CLI utility `bs58-cli` and its dependency tree.
Given the lack of plan, and the somewhat tunnel-visioned solution that evolved, this is definitely not an optimal way of publishing crates to IPFS. It's very much just an exploration of one possibility, and there should be more explorations of other ways to do so. One idea that is likely much better suited to my original goal is to utilize `cargo-vendor` somehow; that would allow publishing a single source distribution that can be built from directly, rather than this multi-level thing with registries. Another idea, better suited to actual development, is to utilize IPNS to allow publishing multiple versions of crates into a single registry, either as per-crate (or per-collection-of-crates) registries, or as a more global registry similar to https://crates.io.
Because Cargo's built-in git support only speaks the "smart" git-http protocol, while the IPFS web gateway can only serve the static files used by the "dumb" protocol, you have to tell Cargo to use the `git` CLI tool instead by editing your `~/.cargo/config`:

```toml
[net]
git-fetch-with-cli = true
```
Then you can install `bs58-cli` from the IPFS-distributed sources:

```console
> cargo install bs58-cli --index http://127.0.0.1:8080/ipfs/QmTo7iPFpM4T961H6mqWdHWYyUUMNbfcQop4YwmPXnQx6Y
    Updating `http://127.0.0.1:8080/ipfs/QmTo7iPFpM4T961H6mqWdHWYyUUMNbfcQop4YwmPXnQx6Y` index
  Downloaded bs58-cli v0.1.0 (registry `http://127.0.0.1:8080/ipfs/QmTo7iPFpM4T961H6mqWdHWYyUUMNbfcQop4YwmPXnQx6Y`)
[...]
   Installed package `bs58-cli v0.1.0 (registry `http://127.0.0.1:8080/ipfs/QmTo7iPFpM4T961H6mqWdHWYyUUMNbfcQop4YwmPXnQx6Y`)` (executable `bs58`)
```
(I suggest pinning `QmTo7iPFpM4T961H6mqWdHWYyUUMNbfcQop4YwmPXnQx6Y` and waiting for the data to be fetched before running `cargo install`.)
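With the IPFS CLI that pinning step should look something like this:

```console
> ipfs pin add QmTo7iPFpM4T961H6mqWdHWYyUUMNbfcQop4YwmPXnQx6Y
pinned QmTo7iPFpM4T961H6mqWdHWYyUUMNbfcQop4YwmPXnQx6Y recursively
```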
(For pre-1.46 Cargo you will have to add the registry into `~/.cargo/config` and use `--registry` instead of `--index`.)
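That configuration would look roughly like this (the registry name `ipfs` is an arbitrary choice here):

```toml
[registries.ipfs]
index = "http://127.0.0.1:8080/ipfs/QmTo7iPFpM4T961H6mqWdHWYyUUMNbfcQop4YwmPXnQx6Y"
```

followed by `cargo install bs58-cli --registry ipfs`.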
The current design takes in a single root crate, at a specific version, precomputes the set of dependencies required to build just this crate, then recursively (with caching):
- Removes dev-dependencies
- Removes references to dependencies not in the precomputed set
- Runs itself on the remaining dependencies to generate their registry indexes
- Updates the current crate to depend on each dependency via its generated registry index
- Publishes the current crate
- Links the published crate to the indexes of each dependency
- Generates and publishes a registry index for this crate
- Links the registry index to the published crate
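A rough sketch of that recursion, where every type and helper is a hypothetical stand-in rather than the tool's actual API:

```rust
use std::collections::{HashMap, HashSet};

// Hypothetical stand-ins; none of these are real types from the tool.
type Cid = String;

#[derive(Clone, Hash, PartialEq, Eq)]
struct CrateId { name: String, version: String }

#[derive(Clone)]
struct Manifest { deps: Vec<CrateId>, dev_deps: Vec<CrateId> }

fn publish(
    id: &CrateId,
    manifests: &HashMap<CrateId, Manifest>,
    allowed: &HashSet<CrateId>,        // the precomputed dependency set
    cache: &mut HashMap<CrateId, Cid>, // memoized crate -> registry index hash
) -> Cid {
    if let Some(cid) = cache.get(id) {
        return cid.clone();
    }

    let mut manifest = manifests[id].clone();
    manifest.dev_deps.clear();                     // strip dev-dependencies
    manifest.deps.retain(|d| allowed.contains(d)); // drop deps outside the set

    // Recurse so every remaining dependency has a published registry index,
    // then point this crate's dependency entries at those indexes.
    let mut dep_indexes = Vec::new();
    for dep in &manifest.deps {
        let index_cid = publish(dep, manifests, allowed, cache);
        dep_indexes.push(format!("http://127.0.0.1:8080/ipfs/{index_cid}"));
    }

    // Publish the crate archive, then a registry index referencing it.
    let crate_cid = ipfs_add(package_archive(&manifest, &dep_indexes));
    let index_cid = ipfs_add(generate_index(id, &crate_cid));

    cache.insert(id.clone(), index_cid.clone());
    index_cid
}

// Placeholders for packaging the archive, generating the index metadata,
// and adding bytes to IPFS (returning their content hash).
fn package_archive(_m: &Manifest, _dep_indexes: &[String]) -> Vec<u8> { unimplemented!() }
fn generate_index(_id: &CrateId, _crate_cid: &Cid) -> Vec<u8> { unimplemented!() }
fn ipfs_add(_bytes: Vec<u8>) -> Cid { unimplemented!() }
```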
This results in a single root IPFS object that requires pinning to keep the entire tree alive, but internally the objects reference each other via direct web gateway URLs to the sub-objects.
When removing references to dependencies not in the precomputed set, the matching is done by name only. This can leave references to versions of a dependency that should not be included. Fixing this would probably require implementing some semver request matching to verify that each dependency request matches one of the allowed versions.
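That check would presumably look something like this, using the `semver` crate (the function here is an illustration, not part of the tool):

```rust
use semver::{Version, VersionReq};

/// Does a dependency request (e.g. "^0.2") match any of the versions
/// that actually appear in the precomputed dependency set?
fn request_matches_allowed(request: &str, allowed: &[Version]) -> bool {
    VersionReq::parse(request)
        .map(|req| allowed.iter().any(|v| req.matches(v)))
        .unwrap_or(false)
}

fn main() {
    let allowed = [Version::parse("0.2.11").unwrap()];
    assert!(request_matches_allowed("^0.2", &allowed));
    assert!(!request_matches_allowed("^0.1", &allowed));
}
```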
The initial design I attempted to build was to just have a pair of published directories: one containing all of the crates involved in the build, and one containing an index for them. This ran into a series of issues that eventually transformed the design into the one described here.
The first major issue was that having an index containing crates that reference each other means the index and the `Cargo.toml` files in the crate archives end up needing to reference each other.
The registry index contains two things: a `config.json` specifying a template URL for where to download the crate archives from, and a set of metadata files specifying the crates available from this registry. Given that I was using the IPFS web gateway to generate download URLs compatible with Cargo, I needed to create a single IPFS directory containing all the crates and put that into the download URL template, like `http://127.0.0.1:8080/ipfs/<hash>/{crate}-{version}.crate` (the `{crate}` and `{version}` markers are filled in by Cargo with the name and version of the crate archive it is downloading).
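Concretely, the `config.json` for such an index would contain something like this (with `<hash>` standing in for the real directory hash):

```json
{
  "dl": "http://127.0.0.1:8080/ipfs/<hash>/{crate}-{version}.crate"
}
```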
The crate archives must each contain a `Cargo.toml` describing the crate within. This includes all dependencies of the crate, specified via a version and a registry. The registry is specified via an (AFAIK) undocumented `registry-index` property containing the URL of the git repo holding the index this dependency lives in; if this is missing, the dependency is assumed to come from the default crates.io registry. Again, given that I am publishing the git repos via the IPFS web gateway, I need to put a URL like `http://127.0.0.1:8080/ipfs/<hash>` into this property.
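In the `Cargo.toml` inside a published crate archive, a dependency entry then looks roughly like this (hypothetical dependency name, placeholder hash):

```toml
[dependencies.some-dep]
version = "1.0.0"
registry-index = "http://127.0.0.1:8080/ipfs/<hash>"
```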
Put together, that gives a cycle:

1. I want to publish the index.
2. To generate the hash for the download URL I need to first package all the crate archives and publish them.
3. To generate the hash for the `registry-index` of the dependencies I need to first publish the index.
4. Goto 1.
My solution here was to publish a single crate per registry. This means I can walk a full dependency DAG, publishing each crate's archive, then its index containing the hash of that archive, then its dependents' archives containing the hashes of their dependencies' indexes.
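For a leaf dependency `foo` and a crate `bar` that depends on it, the publish order would look something like this (commands illustrative, names and hashes invented):

```console
> ipfs add foo-1.0.0.crate     # gives <foo-crate-hash>
> ipfs add -r foo-index/       # its config.json embeds <foo-crate-hash>,
                               # gives <foo-index-hash>
> ipfs add bar-1.0.0.crate     # its Cargo.toml sets registry-index to
                               # http://127.0.0.1:8080/ipfs/<foo-index-hash>
> ipfs add -r bar-index/       # and so on up the DAG
```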
The per-crate registry solution above depends on one thing: having a DAG of the entire set of crates to publish. Unfortunately, for any non-trivial project this is unlikely to hold, because you will commonly have crates that mutually depend on each other via dev-dependencies. One of the first places you'll run into this is `proc-macro2` + `quote`: `quote` is built on top of `proc-macro2` and is invaluable when working with `proc-macro2`; so invaluable, in fact, that `proc-macro2` includes an example of using `quote` in its documentation, requiring it to pull `quote` in as a dev-dependency to test that the example is correct.
For Cargo this is ok: you can construct a build DAG containing `proc-macro2(examples) -> quote -> proc-macro2` because the examples and the library are different build targets. For publishing content-addressed source code this doesn't work: the `proc-macro2` examples are part of the same source code as the library, so they need to be a single crate.
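Simplified, the two manifests contain something like this, and at the source level that's a cycle:

```toml
# quote's Cargo.toml (simplified)
[dependencies]
proc-macro2 = "1.0"
```

```toml
# proc-macro2's Cargo.toml (simplified)
[dev-dependencies]
quote = "1.0"
```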
So we just strip all dev-dependencies, nobody cares about running tests from published code anyway (*cough* except those that do).
After getting rid of dev-dependencies we still don't have a DAG of crates. Unfortunately, it's possible for crates to have loops where they optionally depend on each other. Normally this is fine because no single project activates the full set of optional dependencies that closes the loop, but I found one example where activating just a few features gave a loop detected by Cargo:
```toml
[dependencies]
clap = "2.33.1"
textwrap = { version = "0.11.0", features = ["hyphenation"] }
num-traits = { version = "0.2.11", features = ["libm"] }
libm = { version = "0.2.1", features = ["rand"] }
rand = { version = "0.6.5", features = ["packed_simd"] }
packed_simd = { version = "0.3.3", features = ["sleef-sys"] }
```
```
error: cyclic package dependency: package `atlatl v0.1.2` depends on itself.
Cycle:
package `atlatl v0.1.2`
... which is depended on by `hyphenation v0.7.1`
... which is depended on by `textwrap v0.11.0`
... which is depended on by `clap v2.33.1`
... which is depended on by `bindgen v0.46.0`
... which is depended on by `sleef-sys v0.1.2`
... which is depended on by `packed_simd v0.3.3`
... which is depended on by `rand v0.6.5`
... which is depended on by `libm v0.2.1`
... which is depended on by `num-traits v0.2.11`
... which is depended on by `atlatl v0.1.2`
```
(Though I think this may still be a false positive: the `sleef-sys -> bindgen` dependency edge is a build-dependency, so `textwrap@host` shouldn't have the `hyphenation` feature active. Playing around with `-Zfeatures` I wasn't able to get this to build successfully though.)
Whether or not this should be a valid set of dependencies for a build, it still makes the references at the source level a cyclic graph that we can't publish.
The solution here is to take the resolved build graph from the top-level crate we're attempting to publish and use it to restrict the allowed dependencies. As we recurse down we strip all optional dependencies that weren't actually activated in that graph, adjusting feature sets by removing all activations of the stripped dependency's features and injecting a dummy feature in its place, in case another crate references the optional dependency by name.
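As a sketch of that manifest rewriting, for a hypothetical crate whose optional `serde` dependency was not activated anywhere in the resolved graph:

```toml
# Before: as authored
[dependencies]
serde = { version = "1.0", optional = true }

[features]
serde-support = ["serde", "serde/derive"]
```

becomes

```toml
# After: the unactivated optional dependency is stripped
[features]
serde = []         # dummy feature, in case a dependent enables "serde"
serde-support = [] # activations of the stripped dependency removed
```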