notetoself - Snippets

2025-12-13

Inventorize folder contents > unique.file.txt

# Write "<sha1> <size in bytes> <shell-quoted absolute path>" for every regular
# file below the current directory to output.txt (and to the terminal).
# - bash (not sh) runs the inner command: printf's %q is a bash extension and
#   is rejected as an invalid directive by POSIX shells such as dash.
# - output.txt itself is skipped, otherwise the inventory would hash its own,
#   still growing, result file.
find . -type f ! -path ./output.txt -print0 \
| xargs -0 -P "$(nproc)" -I{} bash -c \
    'printf "%s %s %q\n" \
        "$(sha1sum "$1" | cut -d" " -f1)" \
        "$(stat -c "%s" "$1")" \
        "$(realpath "$1")"' \
    cmd {} \
| tee output.txt

See superuser | Advanced argument escaping with find + xargs and nested commands (https://superuser.com/questions/1864471)

# Read the inventory ("<sha> <size> <path>" per line), group the paths by hash
# and print the 20 hashes with the largest total footprint (size * copies).
# The file is opened in a with-block so the handle is closed again, and it is
# iterated lazily instead of loading every line up front with readlines().
with open("output.txt", errors="replace") as inventory:
    files = [
        (sha, int(size), path)
        for sha, size, path in (
            # strip() first: with maxsplit the last field would otherwise keep
            # its trailing newline
            line.strip().split(maxsplit=2)
            for line in inventory
            if line.strip()
        )
    ]

# sha -> (size, [paths]); the size recorded is that of the first file seen
shas = {}
for sha, size, path in files:
    shas.setdefault(sha, (size, []))[1].append(path)

largest = sorted(
    shas.items(),
    key=lambda item: item[1][0] * len(item[1][1]),
    reverse=True,
)[:20]
for sha, (size, paths) in largest:
    # columns: hash, total MB over all copies, MB per copy, number of copies
    print(f"{sha} {(size * len(paths))>>20}MB {size>>20}MB {len(paths)}")
    for p in paths:
        print(" ", p)
len(files)  # 737514
# Rewrite every *.jpg/*.JPG below the current directory in place with
# ImageMagick (geometry 1500x1500>, quality 100), then run jpegoptim over the
# same files with --max=90.
find . -iname '*.jpg' -exec magick {} -resize '1500x1500>' -quality 100 {} \;
find . -iname '*.jpg' -exec jpegoptim -w10 --max=90 {} +
[uv run] ruff check . --isolated --select I <path/to/file>       [--fix]
# Point poetry at an installed Python 3.11 as listed by uv (second column of
# `uv python list`). Only the first listed interpreter is taken and the result
# is quoted, so poetry receives exactly one argument even when several 3.11
# installations are listed.
poetry env use "$(uv python list --only-installed 3.11 | awk 'NR == 1 {print $2}')"
# Print used/total heap in MB plus the percentage for the JVM matched by pgrep.
# Reads field 4 (total) and field 6 (used) of the GC.heap_info line containing
# "heap" and strips their K suffix — field positions presumably depend on the
# JVM/GC in use; verify against your own output.
jcmd $(pgrep -f /usr/bin/my-process) GC.heap_info \
  | awk '/heap/ {
      total = $4; gsub("K", "", total)
      used = $6; gsub("K", "", used)
      mb_total = total / 1024
      mb_used = used / 1024
      pct = used / total * 100
      printf "Used: %.1f MB / %.1f MB (%.1f%%)\n", mb_used, mb_total, pct
    }'
# Same report for the Jenkins JVM.
jcmd $(pgrep -f /usr/share/java/jenkins.war) GC.heap_info \
  | awk '/heap/ {
      total = $4; gsub("K", "", total)
      used = $6; gsub("K", "", used)
      mb_total = total / 1024
      mb_used = used / 1024
      pct = used / total * 100
      printf "Used: %.1f MB / %.1f MB (%.1f%%)\n", mb_used, mb_total, pct
    }'
# Once per second, print the Jenkins JVM heap usage (MB and percent) followed
# by column 15 of the jstat -gc data row, labelled "FGC".
# Stop with Ctrl-C.
while :; do
  jcmd $(pgrep -f /usr/share/java/jenkins.war) GC.heap_info \
    | awk '/heap/ {
        total = $4; gsub("K", "", total)
        used = $6; gsub("K", "", used)
        mb_total = total / 1024
        mb_used = used / 1024
        pct = used / total * 100
        printf "Used: %.1f MB / %.1f MB (%.1f%%)\n", mb_used, mb_total, pct
      }'
  jstat -gc $(pgrep -f /usr/share/java/jenkins.war) \
    | awk 'NR == 2 { print "FGC: " $15 }'
  sleep 1
done
# Run the SQL statement SHUTDOWN DEFRAG against the Nexus H2 database through
# the H2 Shell tool shipped in the Nexus installation.
java \
  -cp /opt/sonatype/nexus-3.76.1-01/system/com/h2database/h2/2.3.232/h2-2.3.232.jar \
  org.h2.tools.Shell \
  -url jdbc:h2:/opt/sonatype/sonatype-work/nexus3/db/nexus \
  -sql 'SHUTDOWN DEFRAG'
# Shell command that copies every non-directory entry below the source path
# into the destination path, recreating the relative directory layout.
# (ctx / output_dir come from the surrounding rule — presumably a Bazel rule
# implementation; confirm against the caller.)
# The source and destination are written as {src}/{dst} so that .format()
# actually substitutes them, and the literal xargs placeholder is escaped as
# {{}}: a bare {} would be read as a positional format field and make
# .format() fail because no positional argument is passed.
# The dirname results are quoted so relative paths containing spaces survive.
command = """
find {src} ! -type d -print0 | sed -z "s|^{src}/||" | xargs -0 -I{{}} sh -c \\
    'mkdir -p {dst}/"$(dirname "$1")" && cp {src}/"$1" {dst}/"$(dirname "$1")"' \\
    subst {{}}
""".format(src=ctx.file.src.path, dst=output_dir.path)
# Evaluate a Starlark expression over the target that lists the entries of its
# output_groups.
bazel cquery @pnp4nagios//:build \
  --output=starlark \
  --starlark:expr='[f for f in target.output_groups]'
# Block until something below the current directory is modified, created or
# moved (paths matching the exclude pattern are ignored), then run all
# pre-commit hooks and, only if they pass, the example. Repeat forever;
# stop with Ctrl-C.
while :; do
  inotifywait --quiet --recursive --event modify,create,move \
    --exclude '\.git|__pycache__|\.mypy_cache|build|\.venv|\.goutputstream' \
    --format '%w%f' .
  uv run pre-commit run --hook-stage pre-commit --all-files \
    && uv run examples/example.yaml
done
# Print the validity dates of the certificate served by om-office.de:443.
# A single newline on stdin is all s_client gets, so it does not wait for
# interactive input; its stderr output is discarded.
printf '\n' \
  | openssl s_client -connect om-office.de:443 -servername om-office.de 2>/dev/null \
  | openssl x509 -noout -dates
# Run the formatter on every file that differs from HEAD^ (last commit plus
# local modifications). --diff-filter=d leaves out deleted files, which no
# longer exist for the formatter to open.
# The substitution is intentionally unquoted so each file name becomes its own
# argument; file names containing whitespace are not supported.
bazel run //:format $(git diff --name-only --diff-filter=d HEAD^)
# Run the unit tests and highlight failure-related keywords (case-insensitive).
# The empty first alternative matches every line, so no output is filtered
# away — matches are only coloured.
# grep -E replaces egrep, which is obsolescent and prints a warning with
# current GNU grep.
make -C tests test-unit \
| grep -E --color=auto -i "|assertionerror|crash|error|unexpected|cannot|cancel|abort|failure|failed|timeout|exception|fatal"
# Every 10 seconds print "<timestamp> | Total/Used/Free in MB | Used %" taken
# from the Mem: line of `free -m`. Stop with Ctrl-C.
while :; do
  printf '%s | %s\n' \
    "$(date '+%Y-%m-%d %H:%M:%S')" \
    "$(free -m | awk '/Mem:/ {printf "Total: %dMB | Used: %dMB | Free: %dMB | Used: %.1f%%", $2, $3, $4, $3/$2*100}')"
  sleep 10
done
# Delete every __pycache__ directory below BASE_PATH.
# -prune keeps find from descending into a directory that is about to be
# removed, and -exec ... + hands the paths straight to rm, so names containing
# spaces, quotes, backslashes or newlines are passed through unchanged (xargs
# without -0 would reinterpret them). Being a single line, there is also no
# line continuation that a stray trailing blank could break.
find "${BASE_PATH}" -type d -name __pycache__ -prune -exec rm -rf -- {} +
# Try to rmdir every directory below (and including) BASE_PATH, children
# before parents (-depth), so directory chains that become empty are removed
# as well. rmdir refuses non-empty directories and reports an error for each.
# Paths go directly from find to rmdir, so unusual file names (quotes,
# backslashes, newlines) are not reinterpreted the way xargs without -0 would.
find "${BASE_PATH}" -depth -type d -exec rmdir -- {} +
# List untracked files that are ignored according to git's standard exclude
# sources.
git ls-files -o -i --exclude-standard

# One command per line: when these were fused onto a single line, everything
# after the first "#" was treated as a comment and never executed.
git diff-tree --no-commit-id --name-only -r HEAD # touched files in HEAD - with removed files
git diff --name-only HEAD # locally modified

# Files changed locally or by HEAD, without deleted ones, de-duplicated.
cat <(git diff --name-only --diff-filter=d) <(git diff --name-only --diff-filter=d HEAD~1 HEAD) | sort -u

# Run the individual tools on exactly that file list. The substitutions are
# intentionally unquoted so each file name becomes its own argument.
.venv/bin/pytest -svv --doctest-modules $(cat <(git diff --name-only --diff-filter=d) <(git diff --name-only --diff-filter=d HEAD~1 HEAD) | sort -u)
.venv/bin/ruff format $(cat <(git diff --name-only --diff-filter=d) <(git diff --name-only --diff-filter=d HEAD~1 HEAD) | sort -u)
.venv/bin/mypy $(cat <(git diff --name-only --diff-filter=d) <(git diff --name-only --diff-filter=d HEAD~1 HEAD) | sort -u)
.venv/bin/ruff check --fix $(cat <(git diff --name-only --diff-filter=d) <(git diff --name-only --diff-filter=d HEAD~1 HEAD) | sort -u)

# Remove ruff/pytest/mypy caches and __pycache__ directories below the current
# directory. -prune stops find from descending into an entry it is about to
# delete (otherwise it reports "No such file or directory" for each one),
# "--" guards against names starting with a dash, and "+" batches the paths
# into as few rm invocations as possible.
find . \( -name ".ruff_cache" -o -name ".pytest_cache" -o -name "__pycache__" -o -name ".mypy_cache" \) -prune -exec rm -rf -- {} +

# Git aliases (entries for the [alias] section of a git config file).
# fpr <n>: create branch GH-<n>-merge from origin/master, then download the
# patch of pull request <n> and apply it with git am. The two steps are chained
# with && (not a pipe) so the patch is only applied after the branch switch
# succeeded; inner double quotes are escaped as required inside a quoted
# config value; curl -f avoids feeding an HTTP error page to git am.
fpr = !"f() { git switch -c \"GH-$1-merge\" origin/master && curl -fsSL \"https://patch-diff.githubusercontent.com/raw/checkmk/checkmk/pull/$1.patch\" | git am -; }; f"
# gpr: push HEAD to refs/for/master, using the current branch name as topic.
gpr = !"f() { git push origin HEAD:refs/for/master%topic=$(git rev-parse --abbrev-ref HEAD); }; f"

Page source Inventorize folder contents > `unique.file.txt` ```bash find . -type f -print0 \ | xargs -0 -P $(nproc) -I{} sh -c \ 'printf "%s %s %q\n" \ "$(sha1sum "$1" | cut -d" " -f1)" \ "$(stat -c "%s" "$1")" \ "$(realpath "$1")"' \ cmd {} \ | tee output.txt ``` see [superuser | Advanced argument escaping with find + xargs and nested commands](https://superuser.com/questions/1864471) ```python files = [ (sha, int(size), path) for line in open("output.txt", errors="replace").readlines() if line.strip() for sha, size, path in (line.strip().split(maxsplit=2),)] shas = {} for sha, size, path in files: shas.setdefault(sha, (size, []))[1].append(path) for sha, (size, paths) in list(sorted(shas.items(), reverse=True, key=lambda x: x[1][0] * len(x[1][1]))[:20]): print(f"{sha} {(size * len(paths))>>20}MB {size>>20}MB {len(paths)}") for p in paths: print(" ", p) len(files) # 737514 ``` ```bash find . -iname \*.jpg -exec magick {} -resize 1500x1500\> -quality 100 {} \; find . -iname \*.jpg -exec jpegoptim -w10 --max=90 {} + ``` ```sh [uv run] ruff check . 
--isolated --select I <path to="" file=""> [--fix] ``` ```sh poetry env use $(uv python list --only-installed 3.11 | awk '{print $2}') ``` ```sh jcmd $(pgrep -f /usr/bin/my-process) GC.heap_info | grep heap | awk '{total=$4; gsub("K","",total); used=$6; gsub("K","",used); mb_total=total/1024; mb_used=used/1024; pct=used/total*100; printf "Used: %.1f MB / %.1f MB (%.1f%%)\n", mb_used, mb_total, pct}' ``` ``` jcmd $(pgrep -f /usr/share/java/jenkins.war) GC.heap_info | grep heap | awk '{total=$4; gsub("K","",total); used=$6; gsub("K","",used); mb_total=total/1024; mb_used=used/1024; pct=used/total*100; printf "Used: %.1f MB / %.1f MB (%.1f%%)\n", mb_used, mb_total, pct}' ``` ```sh while true; do \ jcmd $(pgrep -f /usr/share/java/jenkins.war) \ GC.heap_info \ | grep heap \ | awk '{total=$4; gsub("K","",total); used=$6; gsub("K","",used); mb_total=total/1024; mb_used=used/1024; pct=used/total*100; printf "Used: %.1f MB / %.1f MB (%.1f%%)\n", mb_used, mb_total, pct}'; \ jstat -gc $(pgrep -f /usr/share/java/jenkins.war) | awk 'NR==2 {print "FGC: " $15}'; \ sleep 1; \ done ``` ```sh java -cp /opt/sonatype/nexus-3.76.1-01/system/com/h2database/h2/2.3.232/h2-2.3.232.jar org.h2.tools.Shell -url jdbc:h2:/opt/sonatype/sonatype-work/nexus3/db/nexus -sql "SHUTDOWN DEFRAG" ``` ``` command = """ find <SRC> ! 
-type d -print0 | sed -z "s|^<SRC>/||" | xargs -0 -I{} sh -c \\ 'mkdir -p <DST>/$(dirname "$1") && cp <SRC>/"$1" <DST>/$(dirname "$1")' \\ subst {} """.format(src=ctx.file.src.path, dst=output_dir.path) ``` ``` bazel cquery @pnp4nagios//:build --output=starlark --starlark:expr="[f for f in target.output_groups]" ``` ```sh while true; do \ inotifywait -q -r -e modify,create,move \ --exclude '\.git|__pycache__|\.mypy_cache|build|\.venv|\.goutputstream' \ --format '%w%f' .; \ uv run pre-commit run --hook-stage pre-commit --all-files \ && uv run examples/example.yaml;\ done ``` ``` echo | openssl s_client -connect om-office.de:443 -servername om-office.de 2>/dev/null | openssl x509 -noout -dates ``` ``` bazel run //:format $(git diff --name-only HEAD^) ``` ``` make -C tests test-unit \ | egrep --color=auto -i "|assertionerror|crash|error|unexpected|cannot|cancel|abort|failure|failed|timeout|exception|fatal" ``` ``` while true; do \ echo "$(date '+%Y-%m-%d %H:%M:%S') | $(free -m | awk '/Mem:/ {printf "Total: %dMB | Used: %dMB | Free: %dMB | Used: %.1f%%", $2, $3, $4, $3/$2*100}')"; \ sleep 10; \ done ``` ``` find "${BASE_PATH}" -type d -name __pycache__ \ | awk '{print length, $0}' | sort -n -r | cut -d' ' -f2- \ | xargs -I{} sh -c 'rm -rf "$1"' cmd {} find "${BASE_PATH}" -type d \ | awk '{print length, $0}' | sort -n -r | cut -d' ' -f2- \ | xargs -I{} sh -c 'rmdir "$1"' cmd {} ``` ``` git ls-files --others --ignored --exclude-standard ``` git diff-tree --no-commit-id --name-only -r HEAD # touched files in HEAD - with removed files git diff --name-only HEAD # locally modified cat <(git diff --name-only --diff-filter=d) <(git diff --name-only --diff-filter=d HEAD~1 HEAD) | sort -u .venv/bin/pytest -svv --doctest-modules $(cat <(git diff --name-only --diff-filter=d) <(git diff --name-only --diff-filter=d HEAD~1 HEAD) | sort -u) .venv/bin/ruff format $(cat <(git diff --name-only --diff-filter=d) <(git diff --name-only --diff-filter=d HEAD~1 HEAD) | sort -u) .venv/bin/mypy 
$(cat <(git diff --name-only --diff-filter=d) <(git diff --name-only --diff-filter=d HEAD~1 HEAD) | sort -u) .venv/bin/ruff check --fix $(cat <(git diff --name-only --diff-filter=d) <(git diff --name-only --diff-filter=d HEAD~1 HEAD) | sort -u) ``` find . \( -name ".ruff_cache" -o -name ".pytest_cache" -o -name "__pycache__" -o -name ".mypy_cache" \) -exec rm -rf {} \; ``` fpr = !"f() { git switch -c "GH-$1-merge" origin/master | curl \"https://patch-diff.githubusercontent.com/raw/checkmk/checkmk/pull/$1.patch\" | git am -; }; f" gpr = !"f() { git push origin HEAD:refs/for/master%topic=$(git rev-parse --abbrev-ref HEAD); }; f" </DST></SRC></DST></SRC></SRC></path>