Add rule size test infrastructure
author |
Steve Losh <steve@stevelosh.com> |
date |
Sat, 20 May 2017 11:24:54 +0000 |
parents |
77a187682a5d |
children |
50011302bb36 |
(in-package :scully.gdl)
(in-readtable :fare-quasiquote)
;;;; Utils --------------------------------------------------------------------
(defvar *ggp-gensym-counter* 0)
(defun gensym-ggp ()
"Return a unique symbol in the `ggp-rules` package."
(values (intern (mkstr 'rule- (incf *ggp-gensym-counter*))
(find-package :ggp-rules))))
;;;; Files --------------------------------------------------------------------
(defun read-gdl (filename)
"Read GDL from the given file"
(let ((*package* (find-package :ggp-rules)))
(with-open-file (stream filename)
(loop
:with done = (gensym)
:for form = (read stream nil done)
:while (not (eq form done))
:collect form))))
(defun dump-gdl (rules &optional stream)
(let ((*package* (find-package :ggp-rules)))
(format stream "~(~{~S~%~}~)" rules)))
;;;; Temperance ---------------------------------------------------------------
(defun load-rules (database rules)
(push-logic-frame-with database
(mapc (lambda (rule)
(if (and (consp rule)
(eq (car rule) 'ggp-rules::<=))
(apply #'invoke-rule database (cdr rule))
(invoke-fact database rule)))
rules)))
;;;; Normalization ------------------------------------------------------------
;;; Normalization takes a set of clauses from raw GDL format and turns them into
;;; friendlier Lispy clauses of the form:
;;;
;;; (head . body)
;;;
;;; * (<= head . body) becomes (head . body)
;;; * (fact) becomes ((fact)), i.e. ((fact) . nil)
;;; * Nullary predicates like terminal have their parens added back.
;;;
;;; So something like (<= terminal (true foo) (not bar)) would become:
;;;
;;; ((terminal)
;;; (true foo)
;;; (not (bar)))
(defun-match normalize-term (term)
(`(ggp-rules::not ,body) `(ggp-rules::not ,(normalize-term body)))
(`(,_ ,@_) term)
(sym `(,sym)))
(defun-match normalize-rule (rule)
(`(ggp-rules::<= ,head ,@body)
`(,(normalize-term head) ,@(mapcar #'normalize-term body)))
(fact `(,(normalize-term fact))))
(defun normalize-rules (gdl-rules)
(mapcar #'normalize-rule gdl-rules))
;;;; Rule Data Access ---------------------------------------------------------
(defun-match bare-term (term)
(`(ggp-rules::not ,x) x)
(_ term))
(defun-match negationp (term)
(`(ggp-rules::not ,_) t)
(_ nil))
(defun-ematch term-predicate (term)
(`(ggp-rules::not (,predicate ,@_)) predicate)
(`(,predicate ,@_) predicate))
(defun-ematch rule-head (rule)
(`(,head ,@_) head))
(defun-ematch rule-body (rule)
(`(,_ ,@body) body))
(defun rule-predicate (rule)
(term-predicate (rule-head rule)))
(defun rule-head= (rule term &optional (predicate #'=))
(funcall predicate (rule-head rule) term))
;;;; Rule Splitting -----------------------------------------------------------
;;; Rules with many terms in their bodies are difficult to make rule trees for,
;;; because the size of the tree grows exponentially. We can fix this problem
;;; by splitting large disjunctions into separate rules.
(defparameter *max-rule-size* 8)
(defun split-rule (head bodies)
(if (<= (length bodies) *max-rule-size*)
(values (mapcar (curry #'cons head) bodies) nil)
(iterate
(for chunk :in (subdivide bodies *max-rule-size*))
(for new-head = (list (gensym-ggp)))
(collecting new-head :into new-heads)
(appending (mapcar (curry #'cons new-head) chunk)
:into new-rules)
(finally
(return (values (append new-rules
(mapcar (lambda (new-head)
(list head new-head))
new-heads))
t))))))
(defun split-rules% (normalized-rules)
(let ((rules (group-by #'rule-head normalized-rules :test #'equal)))
(iterate
(for (head instances) :in-hashtable rules)
(for bodies = (mapcar #'rule-body instances))
(for (values new-instances needed-split) = (split-rule head bodies))
(oring needed-split :into ever-needed-split)
(appending new-instances :into new-rules)
(finally (return (values new-rules ever-needed-split))))))
(defun split-rules (normalized-rules)
(iterate (for (values rules needed-split)
:first (values normalized-rules t)
:then (split-rules% rules))
(for c :from 0)
(while needed-split)
(finally (return (values rules c)))))