moved data handling/management/etc into own directory.
[CommonLispStat.git] / ls-demo.lisp
blob48fd1b9816d5f208260da3f9ca5eff066a419eca
1 ;;; -*- mode: lisp -*-
2 ;;; Copyright (c) 2007, by A.J. Rossini <blindglobe@gmail.com>
3 ;;; See COPYRIGHT file for any additional restrictions (BSD license).
4 ;;; Since 1991, the ANSI standard has finally been finished; edited for ANSI Common Lisp.
6 ;;; Time-stamp: <2008-08-15 16:05:27 tony>
7 ;;; Creation: <2007-01-01 09:21:50 user> WRONG
8 ;;; File: ls-demo.lisp
9 ;;; Author: AJ Rossini <blindglobe@gmail.com>
10 ;;; Copyright: (c) 2007, AJ Rossini. BSD.
11 ;;; Purpose: demonstrations of how one might use CLS.
13 ;;; What is this talk of 'release'? Klingons do not make software
14 ;;; 'releases'. Our software 'escapes', leaving a bloody trail of
15 ;;; designers and quality assurance people in its wake.
17 (in-package :cl-user) ; the system is loaded from the CL-USER package
18 ;;(asdf:oos 'asdf:load-op 'lift) ;; LIFT is needed here, though the reason is unclear;
19 ;; worked around by loading it from lispstat.asd instead (an ugly hack).
20 ;; (asdf:oos 'asdf:load-op 'cffi)
21 ;; (asdf:oos 'asdf:compile-op 'lispstat :force t)
22 ;; (asdf:oos 'asdf:compile-op 'lispstat)
23 (asdf:oos 'asdf:load-op 'lispstat) ; the only active step: run ASDF's load-op on the LISPSTAT system
25 ;;; non-rigorous check for exports.
26 ;;; This is generally not how I expect it to be used.
28 (in-package :cl-user) ; stay in CL-USER, so the calls below must use the LISP-STAT: package prefix
29 (lisp-stat:binomial-quant 0.95 3 0.4) ;;; recorded result: 3
30 (lisp-stat:binomial-quant 0 3 0.4) ;;; recorded result: 0
31 (lisp-stat:normal-rand 20) ;;; 20 floating-point numbers :-)
33 ;;;; THIS is how I expect it to be used, either with work in ls-user,
34 ;;;; or a cloned package similar to ls-user.
36 (in-package :ls-user) ; from here on the demo calls are written without a package prefix
38 ;;;; Matrix algebra.  Every call in this section uses the same 3x3 literal matrix;
40 (chol-decomp #2A((2 3 4) (1 2 4) (2 4 5)))
41 ;; (#2A((1.7888543819998317 0.0 0.0)
42 ;; (1.6770509831248424 0.11180339887498929 0.0)
43 ;; (2.23606797749979 2.23606797749979 3.332000937312528e-8))
44 ;; 5.000000000000003)
48 (defvar my-chol-decomp-test (chol-decomp #2A((2 3 4) (1 2 4) (2 4 5)))) ; keep the result so its parts can be picked out below
49 my-chol-decomp-test
50 (nth 0 my-chol-decomp-test) ; first element of the result list (the 3x3 array in the recorded output above)
51 (nth 1 my-chol-decomp-test) ; second element of the result list (the number in the recorded output above)
54 (lu-decomp #2A((2 3 4) (1 2 4) (2 4 5)))
55 ;; (#2A((2.0 3.0 4.0) (1.0 1.0 1.0) (0.5 0.5 1.5)) #(0 2 2) -1.0 NIL)
57 (lu-solve
58 (lu-decomp #2A((2 3 4) (1 2 4) (2 4 5)))
59 #(2 3 4)) ; LU-SOLVE receives the LU-DECOMP result plus the vector #(2 3 4)
60 ;; #(-2.333333333333333 1.3333333333333335 0.6666666666666666)
62 (inverse #2A((2 3 4) (1 2 4) (2 4 5)))
63 ;; #2A((2.0 -0.33333333333333326 -1.3333333333333335)
64 ;; (-1.0 -0.6666666666666666 1.3333333333333333)
65 ;; (0.0 0.6666666666666666 -0.3333333333333333))
67 (sv-decomp #2A((2 3 4) (1 2 4) (2 4 5)))
68 ;; (#2A((-0.5536537653489974 0.34181191712789266 -0.7593629708013371)
69 ;; (-0.4653437312661058 -0.8832095891230851 -0.05827549615722014)
70 ;; (-0.6905959164998124 0.3211003503429828 0.6480523475178517))
71 ;; #(9.699290438141343 0.8971681569301373 0.3447525123483081)
72 ;; #2A((-0.30454218417339873 0.49334669582252344 -0.8147779426198863)
73 ;; (-0.5520024849987308 0.6057035911404464 0.5730762743603965)
74 ;; (-0.7762392122368734 -0.6242853493399995 -0.08786630745236332))
75 ;; T)
77 (qr-decomp #2A((2 3 4) (1 2 4) (2 4 5)))
78 ;; (#2A((-0.6666666666666665 0.7453559924999298 5.551115123125783e-17)
79 ;; (-0.3333333333333333 -0.2981423969999719 -0.894427190999916)
80 ;; (-0.6666666666666666 -0.5962847939999439 0.44721359549995787))
81 ;; #2A((-3.0 -5.333333333333334 -7.333333333333332)
82 ;; (0.0 -0.7453559924999292 -1.1925695879998877)
83 ;; (0.0 0.0 -1.3416407864998738)))
85 (rcondest #2A((2 3 4) (1 2 4) (2 4 5)))
86 ;; 6.8157451e7
87 ;;; CURRENTLY FAILS!!  NOTE(review): placement is ambiguous -- confirm whether this flags RCONDEST (above) or EIGEN (below).
89 (eigen #2A((2 3 4) (1 2 4) (2 4 5)))
90 ;; (#(10.656854249492381 -0.6568542494923802 -0.9999999999999996)
91 ;; (#(0.4999999999999998 0.4999999999999997 0.7071067811865475)
92 ;; #(-0.49999999999999856 -0.5000000000000011 0.7071067811865474)
93 ;; #(0.7071067811865483 -0.7071067811865466 -1.2560739669470215e-15))
94 ;; NIL)
96 (spline #(1.0 1.2 1.3 1.8 2.1 2.5)
97 #(1.2 2.0 2.1 2.0 1.1 2.8) :xvals 6) ; two 6-element vectors; the recorded output has 6 points, matching :xvals 6
98 ;; ((1.0 1.3 1.6 1.9 2.2 2.5)
99 ;; (1.2 2.1 2.2750696543866313 1.6465231041904045 1.2186576148879609 2.8))
101 ;;; using KERNEL-SMOOTH-FRONT, not KERNEL-SMOOTH-CPORT
102 (kernel-smooth #(1.0 1.2 1.3 1.8 2.1 2.5)
103 #(1.2 2.0 2.1 2.0 1.1 2.8) :xvals 5) ; same two vectors as the SPLINE call; recorded output has 5 points
104 ;; ((1.0 1.375 1.75 2.125 2.5)
105 ;; (1.6603277642110226 1.9471748095239771 1.7938127405752287
106 ;; 1.5871511322219498 2.518194783156392))
108 (kernel-dens #(1.0 1.2 2.5 2.1 1.8 1.2) :xvals 5) ; single data vector; recorded output has 5 points
109 ;; ((1.0 1.375 1.75 2.125 2.5)
110 ;; (0.7224150453621405 0.5820045548233707 0.38216411702854214
111 ;; 0.4829822708587095 0.3485939156929503))
113 (fft #(1.0 1.2 2.5 2.1 1.8))
114 ;; #(#C(1.0 0.0) #C(1.2 0.0) #C(2.5 0.0) #C(2.1 0.0) #C(1.8 0.0))
;; NOTE(review): the recorded FFT output is the input coerced to complex numbers, unchanged -- confirm whether FFT is actually transforming.
116 (lowess #(1.0 1.2 2.5 2.1 1.8 1.2) #(1.2 2.0 2.1 2.0 1.1 2.8)) ; first vector is given unsorted; the recorded output lists it in sorted order
117 ;; (#(1.0 1.2 1.2 1.8 2.1 2.5))
121 ;;;; Special functions
123 ;; Log-gamma function
125 (log-gamma 3.4) ;;1.0923280596789584
129 ;;;; Probability functions
;;;; Each distribution below is exercised through the same naming pattern seen in the
;;;; calls: <name>-quant, <name>-cdf, <name>-dens (or -pmf), and <name>-rand.
;;;; Trailing comments are recorded results; the -rand results vary from run to run.
131 ;; looking at these a bit more, perhaps a more CLOSy style is needed, i.e.
132 ;; (quantile :list-or-cons loc :type type (one of 'empirical 'normal 'cauchy, etc...))
133 ;; similar for the cdf, density, and rand.
134 ;; Probably worth figuring out how to add a new distribution
135 ;; efficiently, i.e. by keeping some kind of list.
137 ;; Normal distribution
139 (normal-quant 0.95) ;;1.6448536279366268
140 (normal-cdf 1.3) ;;0.9031995154143897
141 (normal-dens 1.3) ;;0.17136859204780736
142 (normal-rand 2) ;;(-0.40502015f0 -0.8091404f0)
144 (bivnorm-cdf 0.2 0.4 0.6) ;;0.4736873734160288
146 ;; Cauchy distribution
148 (cauchy-quant 0.95) ;;6.313751514675031
149 (cauchy-cdf 1.3) ;;0.7912855998398473
150 (cauchy-dens 1.3) ;;0.1183308127104695
151 (cauchy-rand 2) ;;(-1.06224644160405 -0.4524695943939537)
153 ;; Gamma distribution
155 (gamma-quant 0.95 4.3) ;;8.178692439291645
156 (gamma-cdf 1.3 4.3) ;;0.028895150986674906
157 (gamma-dens 1.3 4.3) ;;0.0731517686447374
158 (gamma-rand 2 4.3) ;;(2.454918912880936 4.081365384357454)
160 ;; Chi-square distribution
162 (chisq-quant 0.95 3) ;;7.814727903379012
163 (chisq-cdf 1 5) ;;0.03743422675631789
164 (chisq-dens 1 5) ;;0.08065690818083521
165 (chisq-rand 2 4) ;;(1.968535826180572 2.9988646156942997)
167 ;; Beta distribution
169 (beta-quant 0.95 3 2) ;;0.9023885371149876
170 (beta-cdf 0.4 2 2.4) ;;0.4247997418541529
171 (beta-dens 0.4 2 2.4) ;;1.5964741858913518
172 (beta-rand 2 2 2.4) ;;(0.8014897077282279 0.6516371997922659)
174 ;; t distribution
176 (t-quant 0.95 3) ;;2.35336343484194
177 (t-cdf 1 2.3) ;;0.794733624298342
178 (t-dens 1 2.3) ;;0.1978163816318102
179 (t-rand 2 2.3) ;;(-0.34303672776089306 -1.142505872436518)
181 ;; F distribution
183 (f-quant 0.95 3 5) ;;5.409451318117459
184 (f-cdf 1 3.2 5.4) ;;0.5347130905510765
185 (f-dens 1 3.2 5.4) ;;0.37551128864591415
186 (f-rand 2 3 2) ;;(0.7939093442091963 0.07442694152491144)
188 ;; Poisson distribution
190 (poisson-quant 0.95 3.2) ;;6
191 (poisson-cdf 1 3.2) ;;0.17120125672252395
192 (poisson-pmf 1 3.2) ;;0.13043905274097067
193 (poisson-rand 5 3.2) ;;(2 1 2 0 3)
195 ;; Binomial distribution
;; NOTE(review): the two BINOMIAL-QUANT notes below contradict the export check near the
;; top of this file, which records 3 and 0 for the same two calls -- confirm which is current.
197 (binomial-quant 0.95 3 0.4) ;;; DOESN'T RETURN
198 (binomial-quant 0 3 0.4) ;;; -2147483648
199 (binomial-cdf 1 3 0.4) ;;0.6479999999965776
200 (binomial-pmf 1 3 0.4) ;;0.4320000000226171
201 (binomial-rand 5 3 0.4) ;;(2 2 0 1 2)
203 ;;;; OBJECT SYSTEM
205 (in-package :ls-user)
206 (defproto *test-proto*) ; define a prototype, giving only its name
207 *test-proto*
208 (defmeth *test-proto* :make-data (&rest args) nil) ; stub method for the :make-data message: accepts any arguments, body is NIL
210 (defvar my-proto-instance nil)
211 (setf my-proto-instance (send *test-proto* :new)) ; create an instance by sending :new to the prototype
212 (send *test-proto* :own-slots)
213 (lsos::ls-object-slots *test-proto*) ; the LSOS:: calls reach internal (double-colon) symbols of the LSOS package
214 (lsos::ls-object-methods *test-proto*)
215 (lsos::ls-object-parents *test-proto*)
216 (lsos::ls-object-preclist *test-proto*)
217 ;;; The following fail and I do not know why.
218 (send *test-proto* :has-slot 'proto-name) ; NOTE(review): this quoted symbol is read in LS-USER; confirm which package the slot name is interned in
219 (send *test-proto* :has-slot 'PROTO-NAME) ; same symbol as the previous line under the default upcasing reader
220 (send *test-proto* :has-slot 'make-data) ; NOTE(review): MAKE-DATA was defined above as a method, not a slot
221 (send *test-proto* :has-slot 'MAKE-DATA)
222 (send *test-proto* :has-method 'make-data) ; NOTE(review): the method was defined with the keyword :make-data, but this asks about the non-keyword symbol -- confirm
223 (send *test-proto* :has-method 'MAKE-DATA)
;; DEFPROTO2 demonstration.  Two prototypes are defined, one of them is inspected, and
;; then the *test-proto* checks from the previous section are repeated.
;; Fix: the inspected variable used to be *test-proto2*, which nothing in this file
;; defines, so evaluating it would signal an unbound-variable error.  It now names
;; *test-proto3*, the prototype defined two lines earlier.
226 (defproto2 *test-proto3* (list) (list) (list) "test doc" t) ; DEFPROTO2 given three empty lists, a doc string and T
227 (defproto2 *test-proto4*) ; DEFPROTO2 given only the name
228 *test-proto3*
229 (defmeth *test-proto* :make-data (&rest args) nil) ; re-defines the same stub method on *test-proto*
231 (defvar my-proto-instance nil) ; no effect if the variable is already bound (DEFVAR never re-initialises)
232 (setf my-proto-instance (send *test-proto* :new))
233 (send *test-proto* :own-slots)
234 (send *test-proto* :has-slot 'proto-name)
235 (send *test-proto* :has-slot 'PROTO-NAME)
238 ;;;; Testing
240 (in-package :lisp-stat-unittests) ; the test-framework calls below are made from the unit-test package
241 (testsuites)
242 (print-tests)
243 (run-tests) ; run with no :suite argument
244 (last-test-status)
245 ;;(failures)
247 (describe (run-tests :suite 'lisp-stat-ut-testsupport)) ; DESCRIBE prints details of the object RUN-TESTS returns
248 (describe (run-tests :suite 'lisp-stat-ut-testsupport2))
250 (testsuite-tests 'lisp-stat-ut)
251 (run-tests :suite 'lisp-stat-ut)
252 (describe (run-tests :suite 'lisp-stat-ut)) ; note: this runs the suite a second time
254 (run-tests :suite 'lisp-stat-ut-probdistn)
255 (describe (run-tests :suite 'lisp-stat-ut-probdistn))
256 (run-tests :suite 'lisp-stat-ut-spec-fns)
257 (describe (run-tests :suite 'lisp-stat-ut-spec-fns))
259 (find-testsuite 'lisp-stat-ut-lin-alg)
260 (testsuite-tests 'lisp-stat-ut-lin-alg)
261 (run-tests :suite 'lisp-stat-ut-lin-alg)
262 (describe (run-tests :suite 'lisp-stat-ut-lin-alg))
264 ;;;; Data Analysis test
266 (in-package :ls-user)
268 ;; LispStat 1 approach to variables
;; The PROGN groups all the data definitions so they can be evaluated in one step.
;; Fix: the PROGN was never closed, which left every later form in the file nested
;; inside it.  It is now closed right after the "loaded data" message.
270 (progn
271 (def iron (list 61 175 111 124 130 173 169 169 160 224 257 333 199))
272 iron
273 (def aluminum (list 13 21 24 23 64 38 33 61 39 71 112 88 54))
274 aluminum
275 (def absorbtion (list 4 18 14 18 26 26 21 30 28 36 65 62 40))
276 absorbtion
278 ;; LispStat 1 approach to data frames... (list of lists).
;; DIABETES is a quoted list of four sublists; DLABS holds four strings.
;; NOTE(review): presumably one label per sublist, in order -- confirm.
280 (DEF DIABETES
281 (QUOTE ((80 97 105 90 90 86 100 85 97 97 91 87 78 90 86 80 90 99 85 90 90 88 95 90 92 74 98 100 86 98 70 99 75 90 85 99 100 78 106 98 102 90 94 80 93 86 85 96 88 87 94 93 86 86 96 86 89 83 98 100 110 88 100 80 89 91 96 95 82 84 90 100 86 93 107 112 94 93 93 90 99 93 85 89 96 111 107 114 101 108 112 105 103 99 102 110 102 96 95 112 110 92 104 75 92 92 92 93 112 88 114 103 300 303 125 280 216 190 151 303 173 203 195 140 151 275 260 149 233 146 124 213 330 123 130 120 138 188 339 265 353 180 213 328 346)
282 (356 289 319 356 323 381 350 301 379 296 353 306 290 371 312 393 364 359 296 345 378 304 347 327 386 365 365 352 325 321 360 336 352 353 373 376 367 335 396 277 378 360 291 269 318 328 334 356 291 360 313 306 319 349 332 323 323 351 478 398 426 439 429 333 472 436 418 391 390 416 413 385 393 376 403 414 426 364 391 356 398 393 425 318 465 558 503 540 469 486 568 527 537 466 599 477 472 456 517 503 522 476 472 455 442 541 580 472 562 423 643 533 1468 1487 714 1470 1113 972 854 1364 832 967 920 613 857 1373 1133 849 1183 847 538 1001 1520 557 670 636 741 958 1354 1263 1428 923 1025 1246 1568)
283 (124 117 143 199 240 157 221 186 142 131 221 178 136 200 208 202 152 185 116 123 136 134 184 192 279 228 145 172 179 222 134 143 169 263 174 134 182 241 128 222 165 282 94 121 73 106 118 112 157 292 200 220 144 109 151 158 73 81 151 122 117 208 201 131 162 148 130 137 375 146 344 192 115 195 267 281 213 156 221 199 76 490 143 73 237 748 320 188 607 297 232 480 622 287 266 124 297 326 564 408 325 433 180 392 109 313 132 285 139 212 155 120 28 23 232 54 81 87 76 42 102 138 160 131 145 45 118 159 73 103 460 42 13 130 44 314 219 100 10 83 41 77 29 124 15)
284 (3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 3 2 3 3 2 2 3 2 2 3 3 3 3 2 3 3 3 3 3 2 3 3 3 3 3 2 3 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 2 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1))))
287 (DEF DLABS (QUOTE ("GLUFAST" "GLUTEST" "INSTEST" "CCLASS")))
288 (format t "loaded data.~%")) ; the final paren closes the PROGN opened above
291 ;; Simple univariate variable-specific descriptions, all applied to the ABSORBTION list.
292 (fivnum absorbtion)
293 (median absorbtion)
294 (sort-data absorbtion)
295 (rank absorbtion)
296 (standard-deviation absorbtion)
297 (interquartile-range absorbtion)
299 (lisp-stat-matrix::bind-columns aluminum iron) ; reached through the internal (double-colon) symbol of LISP-STAT-MATRIX
300 (bind-columns aluminum iron) ; same call through the unqualified name visible in LS-USER
301 (apply #'bind-columns (list aluminum iron)) ; same arguments again, this time supplied as a list via APPLY
302 (lisp-stat-matrix::bind-columns #2a((1 2)(3 4)) #(5 6)) ; mixed arguments: a 2x2 array and a 2-element vector
303 (bind-columns #2a((1 2)(3 4)) #(5 6))
306 (defvar fit1 nil)
307 (setf fit1 (regression-model absorbtion iron)) ; default options
308 (send fit1 :display)
309 (send fit1 :residuals)
311 iron
312 (defvar fit1a nil)
313 (setf fit1a (regression-model absorbtion iron :print nil)) ; same two arguments as FIT1, plus :print nil
314 (send fit1a :doc)
315 (setf (send fit1a :doc) "this") ;; FIXME: this SETF form would be a more natural way to set the doc (NOTE(review): the original comment was truncated -- confirm the intent)
316 (send fit1a :x)
317 (send fit1a :y)
318 (send fit1a :compute)
319 (send fit1a :sweep-matrix)
320 (send fit1a :basis)
321 (send fit1a :residuals)
322 (send fit1a :display)
;; Disabled scratch form: #+nil makes the reader skip the single form that follows it.
;; Fix: the PROGN was never closed, so the reader would have consumed the rest of the
;; file while looking for its end and then hit end-of-file.  It is now closed after
;; its only visible form.
;; NOTE(review): confirm that nothing further was meant to be disabled.
324 #+nil(progn
325 (array-dimension #2A ((1)) 0)) ; the final paren closes the skipped PROGN
326 ;; more tests
329 ;;; FIXME: need to get multiple-linear regression working -- clearly
330 ;;; simple linear is working above!
331 (defvar m nil "holding variable.")
332 (def m (regression-model (list iron aluminum) absorbtion :print nil)) ; first argument is a list of the two sequences IRON and ALUMINUM
333 (send m :compute)
334 (send m :sweep-matrix)
335 (format t "~%~A~%" (send m :sweep-matrix)) ; print the sweep matrix surrounded by blank lines
336 (send m :display) ;; ERROR...
337 (def m (regression-model (bind-columns iron aluminum) absorbtion)) ; rebinds M; first argument is now the BIND-COLUMNS result
338 (send m :help)
339 (send m :help :display)
340 (send m :help :basis)
342 (send m :plot-residuals)
345 (typep aluminum 'sequence) ; ALUMINUM and IRON were defined with LIST, and lists are sequences
346 (typep iron 'sequence)
347 (matrixp iron)
349 *variables*
351 (variables)
352 (undef 'iron)
353 (variables) ; called again after UNDEF so the result can be compared with the earlier call
355 ;;; More...