;; pronoun.is - a website for pronoun usage examples ;; Copyright (C) 2014 - 2017 Morgan Astra ;; This program is free software: you can redistribute it and/or modify ;; it under the terms of the GNU Affero General Public License as ;; published by the Free Software Foundation, either version 3 of the ;; License, or (at your option) any later version. ;; This program is distributed in the hope that it will be useful, ;; but WITHOUT ANY WARRANTY; without even the implied warranty of ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the ;; GNU Affero General Public License for more details. ;; You should have received a copy of the GNU Affero General Public License ;; along with this program. If not, see <http://www.gnu.org/licenses/> (ns pronouns.util (:require [clojure.string :as s])) (defn print-and-return "for debugging" [x] (println x) x) (defn slurp-tabfile [path] "read a tabfile from a filesystem <path> as a table" (let [lines (s/split (slurp path) #"\n")] (map #(s/split % #"\t") lines))) (defn table-front-filter "filter a <table> to the rows which begin with <query-key>" [query-key table] (let [arity (count query-key)] (filter #(= query-key (take arity %)) table))) (defn table-end-filter "filter a <table> to the rows which end with <query-key>" [query-key table] (let [table-arity (count (first table)) query-arity (count query-key)] (filter #(= query-key (drop (- table-arity query-arity) %)) table))) (defn table-lookup "find the row corresponding to <query-key> in <table>" [query-key table] (if (some #(= "..." %) query-key) (let [[query-front query-end-] (split-with #(not= "..." %) query-key) query-end (drop 1 query-end-) front-matches (table-front-filter query-front table)] (first (table-end-filter query-end front-matches))) (first (table-front-filter query-key table)))) (defn shortest-unambiguous-forward-path "Compute the shortest (in number of path elements) forward path which unambiguously refers to a specific <row> in a <table>. The behavior of this function is undefined if given a <row> that is not in the <table>. See also: shortest-unambiguous-path" [table row] (loop [n 1] (let [row-front (take n row)] (if (>= 1 (count (table-front-filter row-front table))) row-front (recur (inc n)))))) (defn shortest-unambiguous-ellipses-path "Compute the shortest (in number of path elements) ellipses path which unambiguously refers to a specific <row> in a <table>. The behavior of this function is undefined if given a <row> that is not in the <table>. See also: shortest-unambiguous-path" [table row] (let [row-end (last row) filtered-table (table-end-filter [row-end] table)] (loop [n 1] (let [row-front (take n row)] (if (>= 1 (count (table-front-filter row-front filtered-table))) (concat row-front ["..." row-end]) (recur (inc n))))))) (defn shortest-unambiguous-path "Compute the shortest (in number of path elements) path which unambiguously refers to a specific <row> in a <table>. The behavior of this function is undefined if given a <row> that is not in the <table>. A path can either be a 'forward path', in which it specifies the row with elements from the front (e.g. ze/zir), or an 'ellipses path', which elides unnecessary elements from the middle (e.g. they/.../themselves). If the shortest forward and ellipses paths are the same length, prefer the forward path" [table row] (let [forward-path (shortest-unambiguous-forward-path table row) ellipses-path (shortest-unambiguous-ellipses-path table row)] (s/join "/" (if (> (count forward-path) (count ellipses-path)) ellipses-path forward-path)))) (defn abbreviate "return the list of minimum unabiguous paths from a <table>" [table] (map (partial shortest-unambiguous-path table) table)) (defn vec-coerce [x] "wrap a value <x> in a vector if it is not already in one. note that if <x> is already in a sequence for which vector? is false, this will add another layer of nesting." (if (vector? x) x [x])) (defn strip-markup [form] (s/join " " (filter string? (flatten form))))