kevinwang676's picture
Upload 403 files
c06b7e2
raw
history blame
No virus
7.9 kB
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
;;; ;;
;;; Centre for Speech Technology Research ;;
;;; University of Edinburgh, UK ;;
;;; Copyright (c) 1996-2011 ;;
;;; All Rights Reserved. ;;
;;; ;;
;;; Permission is hereby granted, free of charge, to use and distribute ;;
;;; this software and its documentation without restriction, including ;;
;;; without limitation the rights to use, copy, modify, merge, publish, ;;
;;; distribute, sublicense, and/or sell copies of this work, and to ;;
;;; permit persons to whom this work is furnished to do so, subject to ;;
;;; the following conditions: ;;
;;; 1. The code must retain the above copyright notice, this list of ;;
;;; conditions and the following disclaimer. ;;
;;; 2. Any modifications must be clearly marked as such. ;;
;;; 3. Original authors' names are not deleted. ;;
;;; 4. The authors' names are not used to endorse or promote products ;;
;;; derived from this software without specific prior written ;;
;;; permission. ;;
;;; ;;
;;; THE UNIVERSITY OF EDINBURGH AND THE CONTRIBUTORS TO THIS WORK ;;
;;; DISCLAIM ALL WARRANTIES WITH REGARD TO THIS SOFTWARE, INCLUDING ;;
;;; ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS, IN NO EVENT ;;
;;; SHALL THE UNIVERSITY OF EDINBURGH NOR THE CONTRIBUTORS BE LIABLE ;;
;;; FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES ;;
;;; WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN ;;
;;; AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ;;
;;; ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF ;;
;;; THIS SOFTWARE. ;;
;;; ;;
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
;;;
;;; Some functions for manipulating decision trees
;;;
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
(define (cart_prune_tree_thresh tree threshold default)
"(prune_cart_tree_thresh TREE THRESHOLD DEFAULT)
Prune the classification tree TREE so that all tail nodes with
a prediction probabality less than THRESHOLD and changed to return
DEFAULT instead. This may be used when different mistakes have actually
different penalites hence some control of the defaults need to be
controlled."
(cond
((cdr tree) ;; a question
(list
(car tree)
(cart_prune_tree_thresh (car (cdr tree)) threshold default)
(cart_prune_tree_thresh (car (cdr (cdr tree))) threshold default)))
((< (cart_class_probability (car tree)) threshold)
(list (list (list threshold default) default)))
(t ;; leave asis
tree)))
(define (cart_class_probability class)
"(cart_class_probability CLASS)
Returns the probability of the best class in the cart leaf node CLASS.
If CLASS simple has a value and now probabilities the probabilities
it assume to be 1.0."
(let ((val 0.0))
(set! val (assoc (car (last class)) class))
(if val
(car (cdr val))
1.0)))
(define (cart_class_prune_merge tree)
"(cart_class_prune_merge tree)
Prune all sub trees which are pure. That is they all predict the
same class. This can happen when some other pruning technique
as modified a sub-tree now making it pure."
(let ((pure (cart_tree_pure tree)))
(cond
(pure pure)
((cdr tree);; a question
(list
(car tree)
(cart_class_prune_merge (car (cdr tree)))
(cart_class_prune_merge (car (cdr (cdr tree))))))
(t;; a leaf leave asis
tree))))
(define (cart_tree_pure tree)
"(cart_tree_pure tree)
Returns a probability density function if all nodes in this tree
predict the same class and nil otherwise"
(cond
((cdr tree)
(let ((left (cart_tree_pure (car (cdr tree))))
(right (cart_tree_pure (car (cdr (cdr tree))))))
(cond
((not left) nil)
((not right) nil)
((equal? (car (last left)) (car (last right)))
left)
(t
nil))))
(t ;; its a leaf, so of couse its pure
tree)))
(define (cart_simplify_tree tree map)
"(cart_simplify_tree TREE)
Simplify a CART tree by reducing probability density functions to
simple single clasifications (no probabilities). This removes valuable
information from the tree but makes them smaller easier to read by humans
and faster to read by machines. Also the classes may be mapped by the assoc
list in map. The bright ones amongst you will note this could be
better and merge 'is' operators into 'in' operators in some situations
especially if you are ignoring actual probability distributions."
(cond
((cdr tree)
(list
(car tree)
(cart_simplify_tree (car (cdr tree)) map)
(cart_simplify_tree (car (cdr (cdr tree))) map)))
(t
(let ((class (car (last (car tree)))))
(if (assoc class map)
(list (cdr (assoc class map)))
(list (last (car tree))))))))
(define (cart_simplify_tree2 tree)
"(cart_simplify_tree2 TREE)
Simplify a CART tree by reducing probability density functions to
only non-zero probabilities."
(cond
((cdr tree)
(list
(car tree)
(cart_simplify_tree2 (car (cdr tree)))
(cart_simplify_tree2 (car (cdr (cdr tree))))))
(t
(list
(cart_remove_zero_probs (car tree))))))
(define (cart_remove_zero_probs pdf)
"(cart_remove_zero_probs pdf)
Removes zero probability classes in pdf, last in list
is best in class (as from cart leaf node)."
(cond
((null (cdr pdf)) pdf)
((equal? 0 (car (cdr (car pdf))))
(cart_remove_zero_probs (cdr pdf)))
(t
(cons
(car pdf)
(cart_remove_zero_probs (cdr pdf))))))
(define (cart_interpret_debug i tree)
"(cart_interpret_debug i tree)
In comparing output between different implementations (flite vs festival)
This prints out the details as it interprets the tree."
(cond
((cdr tree) ;; question
(format t "%s %s %s\n" (car (car tree)) (upcase (cadr (car tree)))
(car (cddr (car tree))))
(set! a (item.feat i (car (car tree))))
(format t "%s\n" a)
(cond
((string-equal "is" (cadr (car tree)))
(if (string-equal a (car (cddr (car tree))))
(begin
(format t " YES\n")
(cart_interpret_debug i (car (cdr tree))))
(begin
(format t " NO\n")
(cart_interpret_debug i (car (cddr tree))))))
((string-equal "<" (cadr (car tree)))
(if (< (parse-number a) (parse-number (car (cddr (car tree)))))
(begin
(format t " YES\n")
(cart_interpret_debug i (car (cdr tree))))
(begin
(format t " NO\n")
(cart_interpret_debug i (car (cddr tree))))))
(t
(format t "unknown q type %l\n" (car tree)))))
(t ;; leaf
(car tree)
)))
;;;
;;; Prediction tree for OLS trees
;;; applies OLS coefficients from appropriate leaf of tree
;;;
(define (ols_tree_predict i tree)
;; Surprisingly simple function does the necessary work
(let ((p (wagon i tree)))
(apply
+
(cons
(cadr (car (car p))) ;; Intercept
(mapcar
(lambda (fp)
;; get feature value and multiple by coefficent
(* (parse-number (item.feat i (car fp))) (cadr fp)))
(cdr (car p)))))))
(provide 'cart_aux)