;; pronoun.is - a website for pronoun usage examples
;; Copyright (C) 2014 - 2016 Morgan Astra
;; This program is free software: you can redistribute it and/or modify
;; it under the terms of the GNU Affero General Public License as
;; published by the Free Software Foundation, either version 3 of the
;; License, or (at your option) any later version.
;; This program is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
;; GNU Affero General Public License for more details.
;; You should have received a copy of the GNU Affero General Public License
;; along with this program. If not, see
(ns pronouns.util
(:require [clojure.string :as s]))
(defn print-and-return "for debugging" [x] (println x) x)
(defn slurp-tabfile [path]
"read a tabfile from a filesystem as a table"
(let [lines (s/split (slurp path) #"\n")]
(map #(s/split % #"\t") lines)))
(defn table-front-filter
"filter a to the rows which begin with "
[query-key table]
(let [arity (count query-key)]
(filter #(= query-key (take arity %)) table)))
(defn table-end-filter
"filter a to the rows which end with "
[query-key table]
(let [table-arity (count (first table))
query-arity (count query-key)]
(filter #(= query-key (drop (- table-arity query-arity) %)) table)))
(defn table-lookup
"find the row corresponding to in "
[query-key table]
(if (some #(= "..." %) query-key)
(let [[query-front query-end-] (split-with #(not= "..." %) query-key)
query-end (drop 1 query-end-)
front-matches (table-front-filter query-front table)]
(first (table-end-filter query-end front-matches)))
(first (table-front-filter query-key table))))
(defn shortest-unambiguous-forward-path
"Compute the shortest (in number of path elements) forward path which
unambiguously refers to a specific in a . The behavior of
this function is undefined if given a that is not in the .
See also: shortest-unambiguous-path"
[table row]
(loop [n 1]
(let [row-front (take n row)]
(if (>= 1 (count (table-front-filter row-front table)))
row-front
(recur (inc n))))))
(defn shortest-unambiguous-ellipses-path
"Compute the shortest (in number of path elements) ellipses path which
unambiguously refers to a specific in a . The behavior of
this function is undefined if given a that is not in the .
See also: shortest-unambiguous-path"
[table row]
(let [row-end (last row)
filtered-table (table-end-filter [row-end] table)]
(loop [n 1]
(let [row-front (take n row)]
(if (>= 1 (count (table-front-filter row-front filtered-table)))
(concat row-front ["..." row-end])
(recur (inc n)))))))
(defn shortest-unambiguous-path
"Compute the shortest (in number of path elements) path which unambiguously
refers to a specific in a . The behavior of this function is
undefined if given a that is not in the .
A path can either be a 'forward path', in which it specifies the row with
elements from the front (e.g. ze/zir), or an 'ellipses path', which elides
unnecessary elements from the middle (e.g. they/.../themselves). If the
shortest forward and ellipses paths are the same length, prefer the forward
path"
[table row]
(let [forward-path (shortest-unambiguous-forward-path table row)
ellipses-path (shortest-unambiguous-ellipses-path table row)]
(s/join "/"
(if (> (count forward-path) (count ellipses-path))
ellipses-path
forward-path))))
(defn abbreviate
"return the list of minimum unabiguous paths from a "
[table]
(map (partial shortest-unambiguous-path table) table))
(defn vec-coerce [x]
"wrap a value in a vector if it is not already in one. note that if
is already in a sequence for which vector? is false, this will add
another layer of nesting."
(if (vector? x) x [x]))