This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Sets the class-level default `debuglevel` on http.client.HTTPConnection to 1,
# so connections created afterwards inherit a non-zero debug level.
import http.client | |
http.client.HTTPConnection.debuglevel = 1 |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# https://superuser.com/questions/1687960/over-ssh-can-you-use-the-same-private-key-on-the-host-side-for-other-purposes
# Runs ssh under a fresh ssh-agent with agent forwarding (-A); keys used are added to that agent.
alias sshagentssh='ssh-agent ssh -A -o AddKeysToAgent=yes'
# generate ssh key for github
# https://docs.github.com/en/authentication/connecting-to-github-with-ssh/generating-a-new-ssh-key-and-adding-it-to-the-ssh-agent
# -N takes the passphrase as a separate argument: `-N=""` would be parsed as
# option -N with the value `=`, not as an empty passphrase.
# No -b flag: Ed25519 keys have a fixed length, so a bit size is ignored.
ssh-keygen -t ed25519 -C "[email protected]" -f ./id_ed25519 -N "" # -q
# https://stackoverflow.com/questions/4565700/how-to-specify-the-private-ssh-key-to-use-when-executing-shell-command-on-git
# https://github.com/settings/ssh/new
# Make git use only the key generated above ($PWD is expanded now, at export time).
export GIT_SSH_COMMAND="ssh -o IdentitiesOnly=yes -i $PWD/id_ed25519"
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Usage: python parquet2npyztsv.py test.npy data/train-*-of-*.parquet | |
# Usage: python parquet2npyztsv.py test.npz data/train-*-of-*.parquet | |
# Usage: python parquet2npyztsv.py test.tsv data/train-*-of-*.parquet | |
import sys | |
import numpy as np | |
import pyarrow.parquet as pq | |
output_path, *input_paths = sys.argv[1:] |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Usage: bash git_lfs_clone_dedup.sh https://huggingface.co/deepseek-ai/DeepSeek-V3-0324 ~/DeepSeek-V3-0324
# Usage: bash git_lfs_clone_dedup.sh [email protected]:deepseek-ai/DeepSeek-V3-0324 ~/DeepSeek-V3-0324
# https://github.com/git-lfs/git-lfs/discussions/6029
#
# $1 - repository URL to clone
# $2 - destination directory
#
# Clones with LFS smudging disabled, fetches the LFS objects into
# .git/lfs/objects, then replaces each LFS-tracked file in the working tree
# with a hard link to its object so the content is not stored twice.

# Stop early if the clone or the cd fails, so the rm/ln loop below can never
# run in the caller's current directory.
GIT_LFS_SKIP_SMUDGE=1 git clone "$1" "$2" || exit 1
cd "$2" || exit 1
git lfs fetch
# `git lfs ls-files -l` prints "<full oid> <marker> <path>"; the marker column is discarded.
# read -r keeps backslashes in paths literal.
git lfs ls-files -l | while read -r SHA _ FILEPATH; do
    OBJECT=".git/lfs/objects/${SHA:0:2}/${SHA:2:2}/$SHA"
    # Never delete a working-tree file whose object was not fetched.
    if [ ! -f "$OBJECT" ]; then
        echo "skipping $FILEPATH: missing LFS object $OBJECT" >&2
        continue
    fi
    rm "$FILEPATH" && ln "$OBJECT" "$FILEPATH"
done
# Alternative kept for reference: move the objects instead of hard-linking them.
#git lfs ls-files -l | while read SHA DASH FILEPATH; do mv ".git/lfs/objects/${SHA:0:2}/${SHA:2:2}/$SHA" "$FILEPATH"; done
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Installs the git-lfs package with apt, then runs `git lfs install`.
sudo apt-get install git-lfs | |
git lfs install | |
# The commented commands below record `du -sh` output for a plain clone:
# the whole checkout versus its .git/lfs directory alone.
# git clone https://huggingface.co/deepseek-ai/DeepSeek-V3-0324 | |
# du -sh DeepSeek-V3-0324 | |
# # 1.3T DeepSeek-V3-0324/ | |
# du -sh DeepSeek-V3-0324/.git/lfs | |
# # 642G DeepSeek-V3-0324/.git/lfs | |
# https://github.com/git-lfs/git-lfs/discussions/6029 |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
// based on simplified version of Python snippet: https://gist.github.com/vadimkantorov/b26eda3645edb13feaa62b874a3e7f6f | |
function yaml_loads(frontamtter_str) | |
{ | |
const procval = s => (s.length >= 2 && s[0] == '"' && s[s.length - 1] == '"') ? s.slice(1, s.length - 1) : (s.length >= 2 && s[0] == "'" && s[s.length - 1] == "'") ? s.slice(1, s.length - 1) : s; | |
for(const line of frontmatter_str.split('\n')) | |
{ | |
const line_strip = line.trim(); | |
const is_list_item = line_strip.startsWith('- '); |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
// based on https://github.com/tigt/mini-svg-data-uri/issues/24 | |
// Usage: cat myicon.svg | node svgdataurify.js | |
let svg = ""; | |
process.stdin.on("data", (chunk) => { svg += chunk; }); | |
process.stdin.on("end", async () => | |
{ | |
const reWhitespace = /\s+/g, reUrlHexPairs = /%[\dA-F]{2}/g, hexDecode = {'%20': ' ', '%3D': '=', '%3A': ':', '%2F': '/'}, specialHexDecode = match => hexDecode[match] || match.toLowerCase(); | |
if(svg.charCodeAt(0) === 0xfeff) svg = svg.slice(1); | |
svg = svg.trim().replace(reWhitespace, ' ').replaceAll('"', '\''); |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# from https://github.com/microsoft/WSL/issues/8151#issuecomment-2276363014 | |
# Downloads NodeSource's setup_22.x script and pipes it into bash under sudo
# (-E keeps the caller's environment), then installs the nodejs package with apt.
curl -fsSL https://deb.nodesource.com/setup_22.x | sudo -E bash - | |
sudo apt-get install -y nodejs |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# prependfrontmatter ./index.html | |
# Alias for an in-place sed edit that inserts the text `---\n---` before line 1
# of the file given as argument.
# NOTE(review): relies on sed expanding `\n` in the inserted text (GNU sed does);
# confirm on other sed implementations.
alias prependfrontmatter="sed -i '1i---\n---'" | |
# https://unix.stackexchange.com/questions/99350/how-to-insert-text-before-the-first-line-of-a-file |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# python citygeocoder.py > '~citygeocoder.json' | |
# https://www.wikidata.org/wiki/Wikidata:SPARQL_tutorial/en | |
# https://github.com/OSMNames/OSMNames, http://github.com/OSMNames/OSMNames/issues/208 | |
# https://osmnames.org/download/ | |
# https://stackoverflow.com/questions/74261733/how-to-fetch-gps-coordinates-of-worlds-largest-cities-from-wikidata-via-sparql | |
# FIXME: for some reason misses Helsinki | |
import sys | |
import json | |
import urllib.parse |
NewerOlder