-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathschema-el-eval.lisp
514 lines (416 loc) · 13.4 KB
/
schema-el-eval.lisp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
(load "ll-load.lisp")
(ll-load "ll-util.lisp")
(ll-load "ll-cache.lisp")
(ll-load "schema-el.lisp")
(ll-load "schema-unify.lisp")
(ll-load "schema-el-lex.lisp")
(ll-load "schema-time.lisp")
(ll-load "schema-kb.lisp")
(defparameter *BLANK-SCHEMA*
'(epi-schema ((?x blank.v) ** ?E) (:Roles))
)
(defparameter *COMPUTABLE-PREDS* (mk-hashtable (list
(list
'INANIMATE_OBJECT.N
(lambda (args kb)
(if (and
(equal 1 (length args))
(eval-prop (list (car args) 'OBJECT.N) kb)
(not (eval-prop (list (car args) 'AGENT.N) kb))
) (eval-prop-score (list (car args) 'OBJECT.N) kb) 0)
)
)
(list
'=
(lambda (args kb)
(if (loop for arg1 in args
always (loop for arg2 in args
always (equal arg1 arg2))) 1.0 0)
)
)
)))
(defparameter *KB-EXPLICIT* (make-hash-table :test #'equal))
(defparameter *KB-ARG-IND* (make-hash-table :test #'equal))
(defparameter *KB-PRED-IND* (make-hash-table :test #'equal))
(defparameter *KB* (list *KB-EXPLICIT* *KB-ARG-IND* *KB-PRED-IND*))
(defparameter *AGENT-PRONOUNS* '(
HE.PRO
SHE.PRO
I.PRO
ME.PRO
YOU.PRO
HIM.PRO
HER.PRO
THEY.PRO
THEM.PRO
WE.PRO
US.PRO
))
; (defparameter *STORY* *FLOWER-STORY*)
; Determine whether a term needs coreference
(ldefun coref? (term kb)
(or
(lex-pronoun? term)
(eval-prop (list term 'INDEF.A) kb)
)
)
; Transform a proposition into an equivalent
; one with a single argument curried out.
(ldefun curry-prop (prop carg)
(block cp
; Strip charstars
(if (canon-charstar? prop)
; then
(progn
(setf curry-res (curry (car prop) carg))
(return-from cp (list (car curry-res) (second curry-res) (list (third curry-res) (second prop) (third prop))))
;(return-from cr (curry (car prop) carg))
)
)
; Don't curry a predicate that's already monadic
(if (equal 1 (length (prop-all-args prop)))
(return-from cp prop))
(list carg (curry prop carg))
)
)
; Generate all possible monadic curry
; propositions from an n-adic one
(ldefun all-curries (prop)
(loop for arg in (prop-all-args prop)
collect (curry-prop prop arg)
)
)
; Get all terms to which predicates apply that can be
; unified with a given predicate
(ldefun get-pred-uni-terms (pred kb whole-story)
(block gput
(setf terms (list))
(loop for cand-pred being the hash-keys of (kb-pred-ind kb)
do (block unil
(dbg 'coref "pred is ~s~%" pred)
(dbg 'coref "cand-pred is ~s~%" cand-pred)
(dbg 'coref "~%")
(if (not (unify-preds pred cand-pred (make-hash-table :test #'equal) *BLANK-SCHEMA* whole-story))
(return-from unil)
)
(loop for term in (gethash cand-pred (kb-pred-ind kb))
do (push term terms)
)
)
)
(return-from gput (remove-duplicates terms :test #'equal))
)
)
; Get all predicates that apply to a term
(ldefun get-term-preds (term kb)
(remove-duplicates
(append
(loop for prop in (gethash term (kb-arg-ind kb))
if (not (null (curry prop prop)))
collect (curry prop term)
)
; TODO: figure out a better way to enumerate implicitly-true preds?
; or maybe too hard in general?
(loop for pred in *IRREGULAR-PREDS*
if (eval-prop (list term pred) kb)
collect pred
)
) :test #'equal)
)
; Get all terms to which a predicate applies
; TODO: do this much more efficiently for complex predicates
; (e.g. disjunctions)
(ldefun get-pred-terms (pred kb)
(loop for term being the hash-keys of (kb-arg-ind kb)
if (eval-prop (list term pred) kb)
collect term
)
)
(ldefun subsumes-prop? (gen-prop spec-prop)
(ll-cache #'u-subsumes-prop?
(list gen-prop spec-prop) 100 nil)
)
(ldefun u-subsumes-prop? (gen-prop spec-prop)
(block outer
(setf gen-papm (prop-args-pred-mods gen-prop))
(setf gen-pre (car gen-papm))
(setf gen-pred (second gen-papm))
(setf gen-post (third gen-papm))
(setf gen-mods (fourth gen-papm))
(setf spec-papm (prop-args-pred-mods spec-prop))
(setf spec-pre (car spec-papm))
(setf spec-pred (second spec-papm))
(setf spec-post (third spec-papm))
(setf spec-mods (fourth spec-papm))
; TODO: account for mods here. Can we ignore?
(if (and
(equal gen-pre spec-pre)
(equal gen-post spec-post)
(subsumes gen-pred spec-pred))
; then
(return-from outer t)
)
)
)
; Evaluate whether a proposition is true given a knowledge base
(ldefun eval-prop (prop kb)
(> (eval-prop-score prop kb) 0)
)
; Evaluate whether a proposition is true given no knowledge base
(ldefun eval-single-prop (prop)
(> (eval-prop-score prop *KB*) 0)
)
(ldefun skolemized-agent-pronoun? (arg)
(let ((no-nums (intern (join-str-list "" (loop for c across (string arg) if (not (is-digit? c)) collect (string c))))))
(and
(lex-skolem? no-nums)
(equal (car (last (split-str (string no-nums) "-"))) "PRO.SK")
(not (null (member (intern (concat-strs (car (split-str (string no-nums) "-")) ".PRO")) *AGENT-PRONOUNS* :test #'equal)))
)
)
)
(ldefun eval-prop-score (prop kb)
(let (arg)
(block outer
; Only lists are propositions
(if (not (listp prop)) (return-from outer 'ERROR))
(setf pred (prop-pred prop))
(setf args (prop-all-args prop))
(setf mods (prop-mods prop))
;(dbg 'coref "prop ~s~%" prop)
;(dbg 'coref "pred ~s~%" pred)
;(dbg 'coref "args ~s~%" args)
;(dbg 'coref "mods ~s~%" mods)
;(dbg 'coref "~%")
; (format t "raw proposition: ~s~%" prop)
; (format t "canonical proposition: ~s(" pred)
;(loop for arg in args
; do (format t " ~s " arg)
;)
;(format t ")~%")
;(if (> (length mods) 0) (block print-mods
; (format t " prop modifiers:~%")
; (loop for mod in mods
; do (format t " ~s~%" mod)
; )
;))
; Strip negations
(if (equal (car prop) 'NOT)
(return-from outer (if (eval-prop (second prop) kb) 0 1.0)))
; Check for explicit knowledge of this or its negation.
(if (gethash prop (kb-explicit kb))
(return-from outer 1.0)
)
(if (gethash (list 'NOT prop) (kb-explicit kb))
(return-from outer 0)
)
; Handle temporal predicates.
(if (time-prop? prop)
; then
(block do-eval-time-prop
(setf story-time-props (loop for p being the hash-keys of (kb-explicit kb) if (time-prop? p) collect p))
(load-time-model story-time-props)
(return-from outer (if (eval-time-prop prop) 1.0 0))
)
)
; Check for subsuming predicates in the KB.
; TODO: optimize this somehow. Use kb-arg-ind, or
; change indexing to account for subsumptions?
(loop for kbp being the hash-keys of (kb-explicit kb)
; If the KB prop is more specific, the general
; test prop is implied
if (subsumes-prop? prop kbp)
do (return-from outer (subsumption-score (prop-pred prop) (prop-pred kbp)))
if (subsumes-prop? kbp prop)
do (return-from outer (* 0.75 (subsumption-score (prop-pred kbp) (prop-pred prop))))
)
; Special cases for implicitly evaluable monadic predicates
(if (and (equal 2 (length prop)) (equal 1 (length args))) (block monadic-special-cases
(setf arg (car args))
; Names refer to agents.
(if (and (symbolp arg) (has-suffix? (string arg) ".NAME"))
(if (equal pred 'AGENT.N)
(return-from outer 1.0))
)
; He and she pronouns refer to agents.
; TODO: handle "they"
(if (and (symbolp arg) (or
(member arg *AGENT-PRONOUNS* :test #'equal)
; Might be a Skolemized pronoun
(skolemized-agent-pronoun? arg)
))
(if (equal pred 'AGENT.N)
(return-from outer 1.0))
)
; KA-abstractions are actions.
(if (and (equal pred 'ACTION.N)
(canon-kind? arg)
(equal (car arg) 'KA))
; then
(return-from outer 0.25)
)
; KE-abstractions are events.
(if (and (equal pred 'EVENT.N)
(canon-kind? arg)
(equal (car arg) 'KE))
; then
(return-from outer 0.25)
)
))
; Check computable predicates
(if (not (null (gethash pred *COMPUTABLE-PREDS*)))
(return-from outer (funcall (gethash pred *COMPUTABLE-PREDS*) args kb))
)
; If we have a kind, check whether the stipulated predicate
; subsumes the kind's predicate.
(if (and (equal 1 (length args)) (listp (car args)) (equal 'K (car (car args))))
(return-from outer (max
(subsumption-score pred (second (car args)))
(* 0.75 (subsumption-score (second (car args)) pred))
))
)
; Handle "OR"s
(if (not (null (member 'OR prop))) (block handle-or
(loop for e in prop
if (not (equal 'OR e)) do (block handle-or-inner
(setf ep-res (eval-prop e kb))
(if (equal 'ERROR ep-res) (return-from outer 'ERROR))
(if ep-res (return-from outer 1.0))
)
)
; Nothing evaluated to t
(return-from outer 0.0)
))
; Handle "ANDs"
(if (not (null (member 'AND prop))) (block handle-or
(loop for e in prop
if (not (equal 'AND e)) do (block handle-or-inner
(setf ep-res (eval-prop e kb))
(if (equal 'ERROR ep-res) (return-from outer 'ERROR))
(if (null ep-res) (return-from outer 0))
)
)
; Nothing evaluated to nil
(return-from outer 1.0)
))
(return-from outer 0.0)
))
)
(ldefun safe-inc (n)
(if (null n) 1 (+ n 1))
)
(defparameter *IRREGULAR-PREDS* '(
AGENT.N
))
(ldefun irregular-pred? (pred)
(not (null (member pred *IRREGULAR-PREDS* :test #'equal)))
)
; Add some "basic world knowledge"
;(add-to-kb '(FRANK.NAME MALE.A) *KB*)
;(add-to-kb '(MAY.NAME FEMALE.A) *KB*)
;(add-to-kb '(HE.PRO MALE.A) *KB*)
;(add-to-kb '(SHE.PRO FEMALE.A) *KB*)
;(add-to-kb '(HE.PRO AGENT1.N))
;(add-to-kb '(HE.PRO MALE.A))
; TODO: "they" should also admit male or female
; individuals, probably, but the subject/object
; distinction will be a little subtle to intuit
; which one is best. Also, that'll require a
; lambda predicate for the disjunction, so
; eval-prop will have to do that, and maybe even
; some lexical scoping. Boo. :(
; ALSO TODO: eval-prop needs to account for predicate
; hierarchies. So, (FLOWERS1.SK SET-OF (K FLOWER.N))
; should cause an evaluation of (FLOWERS1.SK SET-OF (K OBJECT.N))
; to return true. Also, (FLOWERS1.SK SET-OF (K (YELLOW.A FLOWER.N)))
; should return true. Tricky....
;(add-to-kb '(THEY.PRO SET.N) *KB*)
(add-to-kb '(THEY.PRO SET_OF.PR (K OBJECT.N)) *KB*)
; Process the story one sentence at a time, so we can do
; coreference analysis in one pass. Output the story with
; all coreferences resolved.
(ldefun process-story-coref (story kb) (let (corefs) (block outer
(setf new-story (list))
(loop for conj in story do (block loop_outer
; Make a coreference map for the sentence
(setf corefs (make-hash-table :test #'equal))
; Add all propositions to the KB, indexed by their arguments
(loop for wff in conj do (block loop_inner
(add-to-kb wff kb)
))
; Store the indexed sentence with its old indices.
; That way, when we replace terms in it one by one,
; we can replace them with dummy indices and not have
; to re-index, which could break the indices in the
; index->referent map we'll make.
(setf old-idx-conj (el-idcs conj))
; Find story terms that need coreference
;(format t "conj is ~s~%" conj)
;(format t "idx conj is ~s~%" old-idx-conj)
;(format t "terms are ~s~%" (get-elements-pred-pairs conj #'term?))
(loop for e-pair in (get-elements-pred-pairs conj #'term?)
do (setf e (car e-pair))
do (setf e-idx (second e-pair))
; do (format t "e is ~s~%" e)
if (coref? e kb) do (block resolve-coref
; For each pred, find other terms w/ that pred
(setf share-count (make-hash-table :test #'equal))
(loop for pred in (get-term-preds e kb)
if (not (equal pred 'INDEF.A))
; do (format t "~s: ~s~%" pred (gethash pred (kb-pred-ind kb)))
; do (format t "pred is ~s~%" pred)
append (loop for term in (get-pred-uni-terms pred kb story)
if (not (equal term e))
; collect term
do (setf (gethash term share-count) (safe-inc (gethash term share-count)))
)
)
(setf max-count 0)
(setf max-coref nil)
(loop for term being the hash-keys of share-count
if (>= (gethash term share-count) max-count)
do (block update
(setf max-count (gethash term share-count))
(setf max-coref term)
)
)
; (format t "best coreference for ~s: ~s (~s shared preds)~%" e max-coref max-count)
(if (not (null max-coref))
(setf (gethash e-idx corefs) max-coref))
)
)
;(format t "~%~%")
;(format t "old sentence: ~s~%" conj)
;(format t "resolutions:~%")
(setf new-sent old-idx-conj)
;(format t "new-sent: ~s~%" new-sent)
(loop for idx being the hash-keys of corefs
; We're using the helpers because we've already done
; the indexing ourselves; we want to use the old indices
; for replacement, remember? We're also going to use a
; dummy index (-1) for the substitutions so we don't
; consider them during replacements. All these indices
; get cleaned at the end, so it's fine.
do (setf new-sent (replace-element-idx-helper new-sent idx (gethash idx corefs)))
do (setf elem (clean-idcs (get-element-idx-helper old-idx-conj idx)))
;do (format t "new new sent: ~s~%" new-sent)
do (format t " ~s -> ~s~%" elem (gethash idx corefs))
; So, up till now, we've only replaced the original instances of a term
; that triggered coreference resolution, i.e., pronouns & "the"-determined
; terms. But in the case of absolute names, like FLOWERS2.SK -> FLOWERS1.SK,
; we want to make *all* substitutions, because once they map somewhere,
; they map anywhere (unlike complex terms in general).
if (lex-const? elem)
do (setf new-sent (replace-vals elem (gethash idx corefs) new-sent))
)
(setf new-sent (clean-idcs new-sent))
;(format t "resolved sentence: ~s~%" new-sent)
; (push new-sent new-story)
(setf new-story (append new-story (list new-sent)))
)
)
(return-from outer new-story)
)))
;(format t "old story: ~s~%" *STORY*)
;(format t "new story: ~s~%" (process-story-coref *STORY* *KB*))
;(eval-prop '(MAY.NAME EAT.V (K BALL.N) (ADV-A (WITH.P (K GUSTO.N)))) *KB*)