blob: 4d4f928b9aa96c6b55f5f0e5f4b75bb319faab0f (
plain) (
blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
|
(ns pronouns.util
(:require [clojure.string :as s]))
(defn slurp-tabfile
  "Reads the whole file at `path` and returns a lazy sequence of rows,
  one per line, where each row is a vector of the line's tab-separated
  fields.

  Lines are separated with `s/split-lines`, so both \\n and \\r\\n line
  endings are accepted; a carriage return is never left attached to the
  last field of a row."
  [path]
  (let [lines (s/split-lines (slurp path))]
    (map #(s/split % #"\t") lines)))
(defn table-lookup
  "Returns the first row of `table` whose leading elements are equal to
  `query-key`, or nil when no row matches. Only as many leading elements
  as `query-key` contains are compared."
  [query-key table]
  (let [prefix-length (count query-key)
        matches-key?  (fn [row] (= query-key (take prefix-length row)))]
    (->> table
         (filter matches-key?)
         first)))
(defn tabfile-lookup
  "Loads the rows of the tab-separated file `tabfile` with `slurp-tabfile`
  and returns the result of `table-lookup` for `query-key` on those rows."
  [query-key tabfile]
  (->> tabfile
       slurp-tabfile
       (table-lookup query-key)))
(defn minimum-unambiguous-path
  "Returns the shortest prefix of `sections`, joined with \"/\", that is a
  prefix of exactly one row of `pronouns-table`.

  Starting from `number-of-sections` leading elements (1 when called with
  two arguments), the prefix is lengthened one element at a time until it
  matches exactly one row. Returns nil as soon as a prefix matches no row.

  If the table contains `sections` itself more than once, no prefix can
  ever be unambiguous; in that case the full path is returned instead of
  recurring forever."
  ([pronouns-table sections]
   (minimum-unambiguous-path pronouns-table sections 1))
  ([pronouns-table sections number-of-sections]
   (let [sections-subset (take number-of-sections sections)
         matches?        (fn [row] (= (take number-of-sections row) sections-subset))
         match-count     (count (filter matches? pronouns-table))]
     (cond
       (zero? match-count) nil
       (= 1 match-count)   (s/join "/" sections-subset)
       ;; Once the prefix length exceeds the length of `sections`, only rows
       ;; identical to `sections` can still match, and that set never shrinks
       ;; again. Stop here rather than looping without end.
       (> number-of-sections (count sections)) (s/join "/" sections-subset)
       :else (recur pronouns-table sections (inc number-of-sections))))))
(defn abbreviate
  "Given a list of pronoun rows, returns a lazy sequence containing, for
  each row in order, its minimum unambiguous path within that same list
  (as computed by `minimum-unambiguous-path`)."
  [pronouns-table]
  (for [row pronouns-table]
    (minimum-unambiguous-path pronouns-table row)))
|