Last active
January 2, 2025 17:50
-
-
Save dustingetz/681dcbf16d104b1496a29f2f08965fc8 to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| (ns dustingetz.datafy-fs | |
| "nav implementation for java file system traversals" | |
| (:require [clojure.core.protocols :as ccp :refer [nav]] | |
| [clojure.datafy :refer [datafy]] ; tests only | |
| [clojure.spec.alpha :as s] | |
| [contrib.assert :refer [check]] | |
| [dustingetz.datafy-fs :as fs] | |
| [hyperfiddle.rcf :refer [tests]] | |
| [clojure.java.io :as io]) | |
| (:import [java.nio.file Path Paths Files] | |
| java.io.File | |
| java.nio.file.LinkOption | |
| [java.nio.file.attribute BasicFileAttributes FileTime] | |
| [org.apache.tika Tika] ; mime type detection | |
| )) | |
;; Spec the datafied map (the data), not the underlying java.io.File object.
(s/def ::name string?)
(s/def ::absolute-path string?)
(s/def ::modified inst?)
(s/def ::created inst?)
(s/def ::accessed inst?)
;; Datafy stores the result of BasicFileAttributes#size under ::size, which is
;; a long byte count. It was previously spec'd as string?, which no datafied
;; file could ever satisfy.
(s/def ::size int?)
;; (s/def ::kind (s/nilable qualified-keyword?))
(s/def ::kind qualified-keyword?) ;; HACK FIXME implement nilable in hyperfiddle.spec
;; All keys are optional; any key that is present is still validated against
;; its registered spec.
(s/def ::file (s/keys :opt [::name ::absolute-path ::modified ::created ::accessed ::size ::kind]))
(s/def ::children (s/coll-of ::file))
(defn get-extension
  "Return the extension of `?path` without its leading dot, or nil.

  nil is returned when `?path` is nil/false, when it starts with a dot
  (treated as a hidden file), or when it does not end in a dot followed by
  one or more ASCII letters/digits."
  [?path]
  (if (or (not ?path)
          (= \. (first ?path))) ; hidden
    nil
    ;; re-find yields [whole-match group]; the group still carries the dot.
    (when-let [[_ dotted] (re-find #"(\.[a-zA-Z0-9]+)$" ?path)]
      (subs dotted 1))))
;; RCF tests for get-extension. Names with no dot, a trailing dot, or a leading
;; dot (hidden files such as ".gitignore") yield nil; otherwise the result is
;; the alphanumeric run after the last dot, without the dot itself.
| (tests | |
| "get-extension" | |
| (get-extension nil) := nil | |
| (get-extension "") := nil | |
| (get-extension ".") := nil | |
| (get-extension "..") := nil | |
| (get-extension "image") := nil | |
| (get-extension "image.") := nil | |
| (get-extension "image..") := nil | |
| (get-extension "image.png") := "png" | |
| (get-extension "image.blah.png") := "png" | |
| (get-extension "image.blah..png") := "png" | |
| (get-extension ".gitignore") := nil) | |
;; REPL scratchpad exploring java.io.File interop on the relative directory
;; "src". It is wrapped in `comment`, so nothing here is evaluated on load and
;; the `:=` lines are notes of observed results rather than executed assertions.
| (comment | |
| "java.io.File interop" | |
| (def h (clojure.java.io/file "src")) | |
| (sort (.listFiles h)) | |
| (.getName h) := "src" | |
| (.getPath h) := "src" | |
| (.isDirectory h) := true | |
| (.isFile h) := false | |
| ;(.getParent h) := nil -- ?? | |
| ;(.getParentFile h) := nil -- ?? | |
| (-> (datafy java.io.File) :members keys) | |
| (->> (seq (.listFiles h)) (take 1) first datafy) | |
| (for [x (take 5 (.listFiles h))] (.getName x))) | |
(defn file-path
  "Return the java.nio.file.Path built from the absolute path string of the
  java.io.File `f`."
  [^File f]
  (let [abs-str (.getAbsolutePath f)
        no-more (into-array String [])] ; empty varargs for Paths/get
    (java.nio.file.Paths/get abs-str no-more)))
;; RCF tests for file-path. The expected values ("/" as root, "electric-fiddle"
;; as the parent directory name) are environment-specific: presumably they
;; assume a Unix-like filesystem and a working directory named "electric-fiddle".
| (tests | |
| (def p (file-path (clojure.java.io/file "src"))) | |
| (instance? Path p) := true | |
| (-> (datafy Path) :members keys) | |
| (-> p .getRoot str) := "/" | |
| (-> p .getFileName str) := "src" | |
| (-> p .getParent .getFileName str) := "electric-fiddle" | |
| (-> p .getParent .toFile .getName) := "electric-fiddle" | |
| #_(-> p .getParent .toFile datafy)) | |
(defn path-attrs
  "Read the BasicFileAttributes of Path `p` via Files/readAttributes, passing
  an empty LinkOption array (no link options)."
  [^Path p]
  (let [no-link-opts (into-array java.nio.file.LinkOption [])]
    (Files/readAttributes p BasicFileAttributes no-link-opts)))
;; RCF tests for path-attrs: reads the attributes of the relative directory
;; "src" and checks that it is reported as a directory only (not a symlink,
;; a regular file, or "other").
| (tests | |
| (def attrs (path-attrs (file-path (clojure.java.io/file "src")))) | |
| (instance? BasicFileAttributes attrs) := true | |
| (.isDirectory attrs) := true | |
| (.isSymbolicLink attrs) := false | |
| (.isRegularFile attrs) := false | |
| (.isOther attrs) := false) | |
(defn file-attrs
  "Return the BasicFileAttributes of the java.io.File `f`, by converting it
  with file-path and reading the result with path-attrs."
  [^File f]
  (-> f file-path path-attrs))
;; Smoke test for file-attrs: the form is only evaluated, there is no `:=`
;; assertion on its result.
| (tests | |
| (file-attrs (clojure.java.io/file "src")) | |
| ) | |
;; Binds the var named `...` to the syntax-quoted (hence namespace-qualified)
;; symbol `...`. Evaluating `...` therefore yields the same placeholder symbol
;; that datafy stores under ::parent, which lets tests write `:parent ...`.
| (def ... `...) ; define a value for easy test assertions | |
;; Datafy a java.nio.file.attribute.FileTime as a java.util.Date, going
;; through its Instant.
(extend-protocol ccp/Datafiable
  java.nio.file.attribute.FileTime
  (datafy [file-time]
    (java.util.Date/from (.toInstant file-time))))
;; Single shared Tika instance; defonce keeps it across namespace reloads.
(defonce TIKA (Tika.))

(defn detect-mime-type
  "Ask Tika to detect the MIME type of `file`, passing the File object itself."
  [^File file]
  (.detect TIKA file))

(defn detect-mime-type-no-access
  "Ask Tika to detect the MIME type from the `file-name` string only.
  NOTE(review): presumably this avoids touching the file contents, as the
  name suggests; confirm against Tika's detect(String) documentation."
  [^String file-name]
  (.detect TIKA file-name))

;; Content view of a file, dispatched on the MIME type detected from the File.
(defmulti datafy-file-content detect-mime-type)

;; Plain text: a lazy seq of lines.
;; NOTE(review): the reader is never closed in this method.
(defmethod datafy-file-content "text/plain" [^File f]
  (-> f io/reader line-seq))

;; Anything else: hand back an open reader; nothing here closes it.
(defmethod datafy-file-content :default [^File f]
  (io/reader f))
(extend-protocol ccp/Datafiable
  java.io.File
  (datafy [^File f]
    ; represent object's top layer as EDN-ready value records, for display
    ; datafy is partial display view of an object as value records
    ; nav is ability to resolve back to the underlying object pointers
    ; they compose to navigate display views of objects like a link
    (let [^BasicFileAttributes attrs (file-attrs f) ; hinted to avoid reflective calls below
          n (.getName f)
          mime-type (detect-mime-type-no-access n)]
      (as-> {::name n
             ;; ::dir / ::symlink / ::other, or a keyword named after the file
             ;; extension in this namespace; ::unknown-kind when nothing matches.
             ::kind (cond (.isDirectory attrs) ::dir
                          (.isSymbolicLink attrs) ::symlink
                          (.isOther attrs) ::other
                          (.isRegularFile attrs) (if-let [s (get-extension n)]
                                                   (keyword (namespace ::foo) s)
                                                   ::unknown-kind)
                          :else ::unknown-kind)
             ::absolute-path (-> f .toPath .normalize .toAbsolutePath str)
             ::created (-> attrs .creationTime .toInstant java.util.Date/from)
             ::accessed (-> attrs .lastAccessTime .toInstant java.util.Date/from)
             ::modified (-> attrs .lastModifiedTime .toInstant java.util.Date/from)
             ::size (.size attrs)
             ::mime-type mime-type} %
        ;; Only directories get ::children (sorted lazily) and the ::parent
        ;; placeholder symbol; merging nil for other kinds is a no-op.
        (merge % (when (= ::dir (::kind %))
                   {::children (lazy-seq (sort (.listFiles f)))
                    ::parent `...}))
        (with-meta % {`ccp/nav
                      (fn [_coll k v]
                        (case k
                          ; reverse data back to object, to be datafied again by caller
                          ::modified (.lastModifiedTime attrs)
                          ::created (.creationTime attrs)
                          ::accessed (.lastAccessTime attrs)
                          ::children (some-> v vec)
                          ;; Path#getParent returns null for a filesystem root;
                          ;; some-> yields nil there instead of throwing an NPE.
                          ::parent (some-> f file-path .getParent .toFile)
                          ::content (datafy-file-content f)
                          v))})))))
(tests
  ; careful, calling seq loses metas on the underlying
  (def h (clojure.java.io/file "src-contrib/"))
  (type h) := java.io.File
  "(datafy file) returns an EDN-ready data view that is one layer deep"
  (datafy h)
  := #:dustingetz.datafy-fs{:name "src-contrib",
                            :absolute-path _,
                            :size _,
                            :modified _,
                            :created _,
                            :accessed _,
                            :mime-type _, ; datafy always emits ::mime-type
                            :kind ::dir,
                            :children _
                            :parent ...})
;; RCF tests for nav on a datafied directory (uses `h` defined in an earlier
;; tests block). Navigating ::children yields a collection of java.io.File
;; objects; navigating ::modified yields the underlying FileTime, and datafying
;; that gives a java.util.Date. `*1` / `*2` refer to earlier results, so the
;; order of the forms below matters.
| (tests | |
| "datafy of a directory includes a Clojure coll of children, but child elements are native file | |
| objects" | |
| (as-> (datafy h) % | |
| (nav % ::children (::children %)) | |
| (datafy %) | |
| (take 2 (map type %))) | |
| := [java.io.File java.io.File] | |
| "nav to a leaf returns the native object" | |
| (as-> (datafy h) % | |
| (nav % ::modified (::modified %))) | |
| (type *1) := java.nio.file.attribute.FileTime | |
| "datafy again to get the plain value" | |
| (type (datafy *2)) := java.util.Date) | |
(tests
  ;; Datafy every child of `h`, pick the one named "contrib", and check the
  ;; shape of its datafied view.
  (as-> (datafy h) %
    (nav % ::children (::children %))
    (datafy %) ; can skip - simple data
    (map datafy %)
    (vec (filter #(= (::name %) "contrib") %)) ; stabilize test
    (nav % 0 (% 0))
    (datafy %)
    #_(s/conform ::file %))
  := {::name "contrib",
      ::absolute-path _,
      ::size _,
      ::modified _,
      ::created _,
      ::accessed _,
      ::mime-type _, ; datafy always emits ::mime-type
      ::kind ::dir,
      ::children _
      ::parent ...})
;; RCF test for the ::parent link (uses `h` defined in an earlier tests block):
;; go down into the first child of the directory, then nav ::parent from that
;; child and check we are back at a directory named "src-contrib".
| (tests | |
| "nav into children and back up via parent ref" | |
| (def m (datafy h)) | |
| (::name m) := "src-contrib" | |
| (as-> m % | |
| (nav % ::children (::children %)) | |
| (datafy %) ; dir | |
| (nav % 0 (get % 0)) ; first file in dir | |
| (datafy %) | |
| (nav % ::parent (::parent %)) ; dir (skip level on way up) | |
| (datafy %) | |
| (::name %)) | |
| := "src-contrib") | |
(defn absolute-path
  "Join `path-str` with any `more` segments and return the normalized absolute
  path as a string. Relative input is resolved against the working directory.

  The path is made absolute BEFORE it is normalized. Normalizing a relative
  path first cannot remove leading `..` segments, so `../x` used to come back
  as `<cwd>/../x` instead of the real parent-relative location."
  [^String path-str & more]
  (-> (java.nio.file.Paths/get path-str (into-array String more))
      .toAbsolutePath
      .normalize
      str))
;; REPL scratchpad for absolute-path. It is wrapped in `comment`, so it is not
;; evaluated; the expected strings are from the author's machine.
| (comment | |
| (absolute-path "./") := "/Users/dustin/src/hf/electric-fiddle" | |
| (absolute-path "node_modules") := "/Users/dustin/src/hf/electric-fiddle/node_modules" | |
| (clojure.java.io/file (absolute-path "./")) | |
| (clojure.java.io/file (absolute-path "node_modules"))) | |
(defn relativize-path
  "Express `abs-path` relative to `base-dir`.

  Both arguments are passed through `check`, turned into Paths and normalized.
  Returns nil unless the normalized `abs-path` starts with the normalized
  `base-dir`; otherwise returns the relative path as a string."
  [base-dir abs-path]
  (let [root   (-> base-dir check clojure.java.io/file .toPath .normalize)
        target (-> abs-path check clojure.java.io/file .toPath .normalize)]
    (when (.startsWith target root)
      (str (.relativize root target)))))
;; RCF tests for relativize-path: trailing slashes and "./" prefixes do not
;; change the result, a path equal to the base yields "", and any path that is
;; not under the base (a parent, an unrelated absolute path, or a relative
;; path) yields nil. The "electric-fiddle" expectation presumably assumes the
;; working directory has that name.
| (tests | |
| (relativize-path (absolute-path "./") (absolute-path "./vendor/electric/src")) := "vendor/electric/src" | |
| (relativize-path (absolute-path "./") (absolute-path "./vendor/electric/src/")) := "vendor/electric/src" | |
| (relativize-path (absolute-path "./") (absolute-path "vendor/electric/src")) := "vendor/electric/src" | |
| (relativize-path (absolute-path "./") (absolute-path "vendor/electric/src/")) := "vendor/electric/src" | |
| (relativize-path (absolute-path "../") (absolute-path "vendor/electric/src")) := "electric-fiddle/vendor/electric/src" | |
| (relativize-path (absolute-path "./") (absolute-path "./")) := "" | |
| (relativize-path (absolute-path "./") (absolute-path "")) := "" | |
| (relativize-path (absolute-path "./") (absolute-path "../")) := nil | |
| (relativize-path "/fake/" (absolute-path "./src")) := nil | |
| (relativize-path (absolute-path "./") "/fake/") := nil | |
| (relativize-path (absolute-path "./") "fake") := nil) | |
(s/fdef list-files
  :args (s/cat :file any?)
  :ret (s/coll-of any?))

(defn list-files
  "Datafy the file at `path-str` and nav into its ::children.
  Returns nil when a java.nio.file.NoSuchFileException is thrown."
  [^String path-str]
  (try
    (let [view (-> path-str clojure.java.io/file datafy)
          kids (::children view)]
      (nav view ::children kids))
    (catch java.nio.file.NoSuchFileException _
      nil)))
;; REPL scratchpad for list-files. It is wrapped in `comment`, so it is not
;; evaluated on load.
| (comment | |
| (list-files (absolute-path "./")) | |
| (list-files (absolute-path "node_modules"))) | |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment