Files
logseq/src/test/frontend/db/query_dsl_test.cljs
Gabriel Horner 039da828ac enhance: infer property schema and add new-pages from properties
for sqlite-build graphs. Also fixed numbered page query not working for
db graphs and related tests
2024-06-07 12:10:15 -04:00

656 lines
22 KiB
Clojure

(ns frontend.db.query-dsl-test
(:require [cljs.test :refer [are deftest testing use-fixtures is]]
[clojure.string :as str]
[logseq.common.util.page-ref :as page-ref]
[frontend.db :as db]
[frontend.util :as util]
[frontend.db.query-dsl :as query-dsl]
[frontend.test.helper :as test-helper :include-macros true :refer [load-test-files]]))
;; TODO: quickcheck
;; 1. generate query filters
;; 2. find illegal queries which can't be executed by datascript
;; 3. find filters combinations which might break the current query implementation
(use-fixtures :each {:before test-helper/start-test-db!
:after test-helper/destroy-test-db!})
;; Test helpers
;; ============
(def dsl-query*
"When $EXAMPLE set, prints query result of build query. Useful for
documenting examples and debugging"
(if (some? js/process.env.EXAMPLE)
(fn dsl-query-star [& args]
(let [old-build-query query-dsl/build-query]
(with-redefs [query-dsl/build-query
(fn [& args']
(let [res (apply old-build-query args')]
(println "EXAMPLE:" (pr-str (:query res)))
res))]
(apply query-dsl/query args))))
query-dsl/query))
(defn- dsl-query
[s]
(db/clear-query-state!)
(when-let [result (dsl-query* test-helper/test-db s)]
(map first (deref result))))
(defn- custom-query
[query]
(db/clear-query-state!)
(when-let [result (query-dsl/custom-query test-helper/test-db query {})]
(map first (deref result))))
;; Tests
;; =====
(deftest pre-transform-test
(testing "page references should be quoted and tags should be handled"
(are [x y] (= (query-dsl/pre-transform x) y)
"#foo"
"#tag foo"
"(and #foo)"
"(and #tag foo)"
"[[test #foo]]"
"\"[[test #foo]]\""
"(and [[test #foo]] (or #foo))"
"(and \"[[test #foo]]\" (or #tag foo))"
"\"for #clojure\""
"\"for #clojure\""
"(and \"for #clojure\")"
"(and \"for #clojure\")"
"(and \"for #clojure\" #foo)"
"(and \"for #clojure\" #tag foo)")))
(defn- testable-content
"Only test :block/content up to page-ref as page-ref content varies between db and file graphs"
[{:block/keys [content]}]
(some->> content
(re-find #"[^\[]+")
str/trim))
(defn- block-property-queries-test
[]
(load-test-files [{:file/path "journals/2022_02_28.md"
:file/content "a:: b
- b1
prop-a:: val-a
prop-num:: 2000
- b2
prop-a:: val-a
prop-b:: val-b
- b3
prop-d:: [[no-space-link]]
prop-c:: [[page a]], [[page b]], [[page c]]
prop-linked-num:: [[3000]]
- b4
prop-d:: [[nada]]"}])
(testing "Blocks have given property value"
(is (= #{"b1" "b2"}
(set (map (comp first str/split-lines :block/content)
(dsl-query "(property prop-a val-a)")))))
(is (= ["b2"]
(map (comp first str/split-lines :block/content)
(dsl-query "(property prop-b val-b)")))))
(is (= ["b2"]
(map (comp first str/split-lines :block/content)
(dsl-query "(and (property prop-b val-b))")))
"Blocks have property value with empty AND")
(is (= ["b3"]
(map (comp first str/split-lines :block/content)
(dsl-query "(and (property prop-c \"page c\"))")))
"Blocks have property value from a set of values")
;; TODO: optimize
(is (= ["b3"]
(map (comp first str/split-lines :block/content)
(dsl-query "(and (property prop-c \"page c\") (property prop-c \"page b\"))")))
"Blocks have ANDed property values")
(is (= #{"b2" "b3"}
(set
(map (comp first str/split-lines :block/content)
(dsl-query "(or (property prop-c \"page c\") (property prop-b val-b))"))))
"Blocks have ORed property values")
;; FIXME: Once :number property approach resolved
#_(is (= ["b1"]
(map (comp first str/split-lines :block/content)
(dsl-query "(property prop-num 2000)")))
"Blocks have integer property value")
(is (= ["b3"]
(map (comp first str/split-lines :block/content)
(dsl-query "(property prop-linked-num 3000)")))
"Blocks have property with integer page value")
(is (= ["b3"]
(map (comp first str/split-lines :block/content)
(dsl-query "(property prop-d no-space-link)")))
"Blocks have property value with no space")
(is (= ["b3" "b4"]
(map (comp first str/split-lines :block/content)
(dsl-query "(property prop-d)")))
"Blocks that have a property"))
(deftest ^:done block-property-queries
(testing "block property tests with default config"
(test-helper/with-config {}
(block-property-queries-test))))
(deftest ^:done block-property-query-performance
(let [pages (->> (repeat 10 {:tags ["tag1" "tag2"]})
(map-indexed (fn [idx {:keys [tags]}]
{:file/path (str "pages/page" idx ".md")
:file/content (if (seq tags)
(str "page-prop:: b\n- block for page" idx
"\ntagz:: " (str/join ", " (map page-ref/->page-ref tags)))
"")})))
_ (load-test-files pages)
{:keys [result time]}
(util/with-time (dsl-query "(and (property tagz tag1) (property tagz tag2))"))]
;; Specific number isn't as important as ensuring query doesn't take orders
;; of magnitude longer
(is (> 40.0 time) "multi property query perf is reasonable")
(is (= 10 (count result)))))
(defn- page-property-queries-test
[]
(load-test-files [{:file/path "pages/page1.md"
:file/content "parent:: [[child page 1]], [[child-no-space]]\ninteresting:: true"}
{:file/path "pages/page2.md"
:file/content "foo:: #bar\ninteresting:: false"}
{:file/path "pages/page3.md"
:file/content "parent:: [[child page 1]], [[child page 2]]\nfoo:: bar\ninteresting:: false"}
{:file/path "pages/page4.md"
:file/content "parent:: [[child page 2]]\nfoo:: baz"}])
(is (= ["page1" "page3" "page4"]
(map :block/name (dsl-query "(page-property parent)")))
"Pages have given property")
(is (= ["page1" "page3"]
(map :block/name (dsl-query "(page-property parent [[child page 1]])")))
"Pages have property value that is a page and query is a page")
(is (= ["page1" "page3"]
(map :block/name (dsl-query "(page-property parent \"child page 1\")")))
"Pages have property value that is a page and query is a string")
(is (= ["page1"]
(map :block/name (dsl-query "(page-property parent [[child-no-space]])")))
"Pages have property value that is a page with no spaces")
(is (= ["page3"]
(map
:block/name
(dsl-query "(and (page-property parent [[child page 1]]) (page-property parent [[child page 2]]))")))
"Page property queries ANDed")
(is (= ["page1" "page3" "page4"]
(map
:block/name
(dsl-query "(or (page-property parent [[child page 1]]) (page-property parent [[child page 2]]))")))
"Page property queries ORed")
(is (= ["page1" "page3"]
(map :block/name
(dsl-query "(and (page-property parent [[child page 1]]) (or (page-property interesting true) (page-property parent [[child page 2]])))"))))
(is (= ["page4"]
(map
:block/name
(dsl-query "(and (page-property parent [[child page 2]]) (not (page-property foo bar)))")))
"Page property queries nested NOT in second clause")
(is (= ["page4"]
(map
:block/name
(dsl-query "(and (not (page-property foo bar)) (page-property parent [[child page 2]]))")))
"Page property queries nested NOT in first clause")
(testing "boolean values"
(is (= ["page1"]
(map :block/name (dsl-query "(page-property interesting true)")))
"Boolean true")
(is (= ["page2" "page3"]
(map :block/name (dsl-query "(page-property interesting false)")))
"Boolean false")))
(deftest page-property-queries
(testing "page property tests with default config"
(test-helper/with-config {}
(page-property-queries-test))))
(deftest task-queries
(load-test-files [{:file/path "pages/page1.md"
:file/content "foo:: bar
- NOW b1
- TODO b2
- LATER b3
- LATER [#A] b4
- LATER [#B] b5"}])
(testing "Lowercase query"
(is (= ["NOW b1"]
(map :block/content (dsl-query "(task now)"))))
(is (= ["LATER b3" "LATER [#A] b4" "LATER [#B] b5"]
(map :block/content (dsl-query "(task later)")))))
(is (= ["LATER b3" "LATER [#A] b4" "LATER [#B] b5"]
(map :block/content (dsl-query "(task LATER)")))
"Uppercase query")
(testing "Multiple specified tasks results in ORed results"
(is (= ["NOW b1" "LATER b3" "LATER [#A] b4" "LATER [#B] b5"]
(map :block/content (dsl-query "(task now later)"))))
(is (= ["NOW b1" "LATER b3" "LATER [#A] b4" "LATER [#B] b5"]
(map :block/content (dsl-query "(task [now later])")))
"Multiple arguments specified with vector notation"))
(is (= ["NOW b1" "LATER [#A] b4"]
(map :block/content
(dsl-query "(or (todo now) (and (todo later) (priority a)))")))
"Multiple boolean operators with todo and priority operators")
(is (= ["LATER [#A] b4" "LATER [#B] b5"]
(map :block/content
(dsl-query "(and (todo later) (or (priority a) (priority b)))")))))
(deftest sample-queries
(load-test-files [{:file/path "pages/page1.md"
:file/content "foo:: bar
- TODO b1
- TODO b2"}])
(is (= 1
(count (dsl-query "(and (task todo) (sample 1))")))
"Correctly limits block results")
(is (= 1
(count (dsl-query "(and (page-property foo) (sample 1))")))
"Correctly limits page results"))
(deftest priority-queries
(load-test-files [{:file/path "pages/page1.md"
:file/content "foo:: bar
- [#A] b1
- [#B] b2
- [#A] b3"}])
(testing "one arg queries"
(is (= ["[#A] b1" "[#A] b3"]
(map :block/content (dsl-query "(priority A)"))))
(is (= ["[#A] b1" "[#A] b3"]
(map :block/content (dsl-query "(priority a)")))))
(testing "two arg queries"
(is (= ["[#A] b1" "[#B] b2" "[#A] b3"]
(map :block/content (dsl-query "(priority a b)"))))
(is (= ["[#A] b1" "[#B] b2" "[#A] b3"]
(map :block/content (dsl-query "(priority [a b])")))
"Arguments with vector notation"))
(is (= ["[#A] b1" "[#B] b2" "[#A] b3"]
(map :block/content (dsl-query "(priority a b c)")))
"Three arg queries and args that have no match"))
(deftest ^:done nested-boolean-queries
(load-test-files [{:file/path "pages/page1.md"
:file/content "foo:: bar
- DONE b1 [[page 1]] [[page 3]]
- DONE b2Z [[page 1]]"}
{:file/path "pages/page2.md"
:file/content "foo:: bar
- NOW b3 [[page 1]]
- LATER b4Z [[page 2]]
"}])
(let [task-filter (if js/process.env.DB_GRAPH "(todo doing todo)" "(todo now later)")]
(is (= []
(dsl-query "(and (todo done) (not [[page 1]]))")))
(is (= ["DONE b1"]
(map testable-content
(dsl-query "(and [[page 1]] (and [[page 3]] (not (task todo))))")))
"Nested not")
(is (= ["NOW b3" "LATER b4Z"]
(map testable-content
(dsl-query (str "(and " task-filter " (or [[page 1]] [[page 2]]))")))))
(is (= #{"NOW b3"
"LATER b4Z"
"DONE b1"
"DONE b2Z"}
(set (map testable-content
(dsl-query (str "(and "
(if js/process.env.DB_GRAPH "(todo doing todo done)" "(todo now later done)")
" (or [[page 1]] (not [[page 1]])))"))))))
(is (= (if js/process.env.DB_GRAPH #{"bar" "DONE b1" "DONE b2Z"} #{"foo:: bar" "DONE b1" "DONE b2Z"})
(->> (dsl-query (str "(not (and " task-filter " (or [[page 1]] [[page 2]])))"))
(keep testable-content)
set)))
(is (= #{"DONE b2Z" "LATER b4Z"}
(->> (dsl-query "(and \"Z\" (or \"b2\" \"b4\"))")
(keep testable-content)
set))
"AND-OR with full text search"))
;; FIXME: not working
;; Requires or-join and not-join which aren't supported yet
; (is (= []
; (dsl-query "(or (priority a) (not (priority c)))")))
)
(deftest ^:done page-tags-and-all-page-tags-queries
(load-test-files
[{:file/path "pages/page1.md"
:file/content "tags:: [[page-tag-1]], [[page-tag-2]]"}
{:file/path "pages/page2.md"
:file/content "tags:: [[page-tag-2]], [[page-tag-3]]"}
{:file/path "pages/page3.md"
:file/content "tags:: [[other]]"}])
(are [x y] (= (set y) (set (map :block/name (dsl-query x))))
"(page-tags [[page-tag-1]])"
["page1"]
"(page-tags page-tag-2)"
["page1" "page2"]
"(page-tags page-tag-1 page-tag-2)"
["page1" "page2"]
"(page-tags page-TAG-1 page-tag-2)"
["page1" "page2"]
"(page-tags [page-tag-1 page-tag-2])"
["page1" "page2"]
"(all-page-tags)"
["page-tag-1" "page-tag-2" "page-tag-3" "other"]))
(deftest block-content-query
(load-test-files [{:file/path "pages/page1.md"
:file/content "- b1 Hit\n- b2 Another"}])
(is (= ["b1 Hit"]
(map :block/content (dsl-query "\"Hit\""))))
(is (= []
(map :block/content (dsl-query "\"miss\"")))
"Correctly returns no results"))
(deftest page-queries
(load-test-files [{:file/path "pages/page1.md"
:file/content "foo"}
{:file/path "pages/page2.md"
:file/content "bar"}])
(is (= ["page1"]
(map #(get-in % [:block/page :block/name])
(dsl-query "(page page1)"))))
(is (= []
(map #(get-in % [:block/page :block/name])
(dsl-query "(page nope)")))
"Correctly returns no results"))
(deftest ^:done empty-queries
(testing "nil or blank strings should be ignored"
(are [x] (nil? (dsl-query x))
nil
""
" "
"\"\"")))
(deftest ^:done page-ref-and-boolean-queries
(load-test-files [{:file/path "pages/page1.md"
:file/content "foo:: bar
- b1 [[page 1]] [[tag2]]
- b2 [[page 2]] [[tag1]]
- b3"}])
(testing "page-ref queries"
(is (= ["b2"]
(map testable-content (dsl-query "[[page 2]]")))
"Page ref arg")
(is (= ["b2"]
(map testable-content (dsl-query "#tag1")))
"Tag arg")
(is (= []
(dsl-query "[[blarg]]"))
"Nonexistent page returns no results"))
(testing "basic boolean queries"
(is (= ["b2"]
(map testable-content
(dsl-query "(and [[tag1]] [[page 2]])")))
"AND query")
(is (= ["b1" "b2"]
(map testable-content
(dsl-query "(or [[tag2]] [[page 2]])")))
"OR query")
(is (= ["b1"]
(map testable-content
(dsl-query "(or [[tag2]] [[page 3]])")))
"OR query with nonexistent page should return meaningful results")
(is (= (if js/process.env.DB_GRAPH #{"b1" "bar" "b3"} #{"b1" "foo:: bar" "b3"})
(->> (dsl-query "(not [[page 2]])")
;; Only filter to page1 to get meaningful results
(filter #(= "page1" (get-in % [:block/page :block/name])))
(map testable-content)
(set)))
"NOT query")))
(deftest ^:done nested-page-ref-queries
(load-test-files (if js/process.env.DB_GRAPH
[{:page {:block/original-name "page1"}
:blocks [{:block/content "p1 [[Parent page]]"
:build/children [{:block/content "[[Child page]]"}]}
{:block/content "p2 [[Parent page]]"
:build/children [{:block/content "Non linked content"}]}]}]
[{:file/path "pages/page1.md"
:file/content "foo:: bar
- p1 [[Parent page]]
- [[Child page]]
- p2 [[Parent page]]
- Non linked content"}]))
(is (= ["Non linked content"
"p2"
"p1"]
(map testable-content
(dsl-query "(and [[Parent page]] (not [[Child page]]))")))))
(deftest ^:done between-queries
(load-test-files [{:file/path "journals/2020_12_26.md"
:file/content "foo::bar
- DONE 26-b1
created-at:: 1608968448113
- LATER 26-b2-modified-later
created-at:: 1608968448114
- DONE 26-b3
created-at:: 1608968448115
- 26-b4
created-at:: 1608968448116
"}])
(let [task-filter (if js/process.env.DB_GRAPH "(task todo done)" "(task later done)")]
(are [x y] (= (count (dsl-query x)) y)
(str "(and " task-filter " (between [[Dec 26th, 2020]] tomorrow))")
3
;; between with journal pages
(str "(and " task-filter " (between [[Dec 26th, 2020]] [[Dec 27th, 2020]]))")
3
;; ;; between with created-at
;; "(and (task now later done) (between created-at [[Dec 26th, 2020]] tomorrow))"
;; 3
)))
(deftest ^:done custom-query-test
(load-test-files [{:file/path "pages/page1.md"
:file/content "foo:: bar
- NOW b1
- TODO b2
- LATER b3
- b3"}])
(let [task-query (if js/process.env.DB_GRAPH
'(task doing)
'(task now))]
(is (= ["NOW b1"]
(map :block/content (custom-query {:query task-query}))))
(is (= ["NOW b1"]
(map :block/content (custom-query {:query (list 'and task-query "b")})))
"Query with rule that can't be derived from the form itself")))
(if js/process.env.DB_GRAPH
(def get-property-value query-dsl/get-db-property-value)
(def get-property-value #(get-in %1 [:block/properties %2])))
(deftest sort-by-queries
(load-test-files [{:file/path "journals/2020_02_25.md"
:file/content "rating:: 10"}
{:file/path "journals/2020_12_26.md"
:file/content "rating:: 8
- DONE 26-b1
created-at:: 1608968448113
fruit:: plum
- LATER 26-b2-modified-later
created-at:: 1608968448114
fruit:: apple
- DONE 26-b3 has no fruit to test sorting of absent property value
created-at:: 1608968448115
- 26-b4
created-at:: 1608968448116
"}])
(let [task-filter (if js/process.env.DB_GRAPH "(task todo done)" "(task later done)")]
(testing "sort-by user block property fruit"
(let [result (->> (dsl-query (str "(and " task-filter " (sort-by fruit))"))
(map #(get-property-value % :fruit)))]
(is (= ["plum" "apple" nil]
result)
"sort-by correctly defaults to desc"))
(let [result (->> (dsl-query (str "(and " task-filter " (sort-by fruit desc))"))
(map #(get-property-value % :fruit)))]
(is (= ["plum" "apple" nil]
result)
"sort-by desc"))
(let [result (->> (dsl-query (str "(and " task-filter " (sort-by fruit asc))"))
(map #(get-property-value % :fruit)))]
(is (= [nil "apple" "plum"]
result)
"sort-by asc")))
(testing "sort-by hidden, built-in block property created-at"
(let [result (->> (dsl-query (str "(and " task-filter " (sort-by created-at desc))"))
(map #(get-property-value % :created-at)))]
(is (= [1608968448115 1608968448114 1608968448113]
result))
"sorted-by desc")
(let [result (->> (dsl-query (str "(and " task-filter " (sort-by created-at asc))"))
(map #(get-property-value % :created-at)))]
(is (= [1608968448113 1608968448114 1608968448115]
result)
"sorted-by asc")))
;; FIXME: Once :number property approach resolved
#_(testing "user page property rating"
(is (= [10 8]
(->> (dsl-query "(and (page-property rating) (sort-by rating))")
(map #(get-property-value % :rating))))))))
(deftest ^:done simplify-query
(are [x y] (= (query-dsl/simplify-query x) y)
'(and [[foo]])
'[[foo]]
'(and (and [[foo]]))
'[[foo]]
'(and (or [[foo]]))
'[[foo]]
'(and (not [[foo]]))
'(not [[foo]])
'(and (or (and [[foo]])))
'[[foo]]
'(not (or [[foo]]))
'(not [[foo]])))
(comment
(require '[clojure.pprint :as pprint])
(test-helper/start-test-db!)
(query-dsl/query test-db "(task done)")
;; Useful for debugging
(prn
(datascript.core/q
'[:find (pull ?b [*])
:where
[?b :block/name]]
(frontend.db/get-db test-db)))
;; (or (priority a) (not (priority a)))
;; FIXME: Error: Insufficient bindings: #{?priority} not bound in [(contains? #{"A"} ?priority)]
(pprint/pprint
(d/q
'[:find (pull ?b [*])
:where
[?b :block/uuid]
(or (and [?b :block/priority ?priority] [(contains? #{"A"} ?priority)])
(not [?b :block/priority #{"A"}]
[(contains? #{"A"} ?priority)]))]
(frontend.db/get-db test-db))))
(when-not js/process.env.DB_GRAPH
(deftest namespace-queries
(load-test-files [{:file/path "pages/ns1.page1.md"
:file/content "foo"}
{:file/path "pages/ns1.page2.md"
:file/content "bar"}
{:file/path "pages/ns2.page1.md"
:file/content "baz"}])
(is (= #{"ns1/page1" "ns1/page2"}
(set (map :block/name (dsl-query "(namespace ns1)")))))
(is (= #{}
(set (map :block/name (dsl-query "(namespace blarg)"))))
"Correctly returns no results")))