TODO.lisp

   1 ;;; -*- mode: lisp -*-
   2
   3 ;;; Time-stamp: <2009-04-02 15:51:12 tony>
   4 ;;; Creation:   <2008-09-08 08:06:30 tony>
   5 ;;; File:       TODO.lisp
   6 ;;; Author:     AJ Rossini <blindglobe@gmail.com>
   7 ;;; Copyright:  (c) 2007-2008, AJ Rossini <blindglobe@gmail.com>.  BSD.
   8 ;;; Purpose:    Stuff that needs to be made working sits inside the progns...
   9
  10 ;;; What is this talk of 'release'? Klingons do not make software
  11 ;;; 'releases'.  Our software 'escapes', leaving a bloody trail of
  12 ;;; designers and quality assurance people in its wake.
  13
  14 ;;; This file contains the current challenges to solve, including a
  15 ;;; description of the setup and the work to solve....
  16
  17 ;;; SET UP
  18
  19 (in-package :cl-user)
  20 ;;(asdf:oos 'asdf:compile-op 'lispstat)
  21 ;;(asdf:oos 'asdf:load-op 'lispstat)
  22
  23 (in-package :lisp-stat-unittests)
  24
  25 ;; tests = 79, failures = 7, errors = 17
  26
  27 (describe (run-tests :suite 'lisp-stat-ut))
  28 (run-tests :suite 'lisp-stat-ut)
  29
  30 #|
  31   ;; FIXME: Example: currently not relevant, yet
  32   (describe
  33     (lift::run-test
  34       :test-case  'lisp-stat-unittests::create-proto
  35       :suite 'lisp-stat-unittests::lisp-stat-ut-proto))
  36 |#
  37
  38 (describe 'lisp-stat-ut)
  39 (in-package :ls-user)
  40
  41
  42 (progn ;; dataframe
  43
  44   (describe (lift::run-tests :suite 'lisp-stat-ut-dataframe))
  45   (lift::run-tests :suite 'lisp-stat-ut-dataframe)
  46
  47   (describe
  48     (lift::run-test
  49       :test-case  'lisp-stat-unittests::create-proto
  50       :suite 'lisp-stat-unittests::lisp-stat-ut-proto))
  51
  52   (defparameter *my-df-1*
  53         (make-instance 'dataframe-array
  54                        :storage #2A((1 2 3 4 5)
  55                                     (10 20 30 40 50))
  56                        :doc "This is an interesting dataframe-array"
  57                        :case-labels (list "x" "y")
  58                        :var-labels (list "a" "b" "c" "d" "e")))
  59
  60   (setf (dfref *my-df-1* 0 0) -1d0)
  61
  62
  63
  64   (make-dataframe  #2A((1 2 3 4 5)
  65                        (10 20 30 40 50)))
  66
  67   (make-dataframe (rand 4 3))
  68
  69
  70   (equalp (dataset
  71           (make-instance 'dataframe-array
  72                          :storage #2A(('a 'b)
  73                                       ('c 'd))))
  74                  #2A(('a 'b)
  75                      ('c 'd)) )
  76
  77   (equalp (dataset
  78           (make-instance 'dataframe-array
  79                          :storage #2A((1 2)
  80                                       (3 4))))
  81                  #2A((1 2)
  82                      (3 4)))
  83
  84   (equalp (dataset
  85           (make-instance 'dataframe-array
  86                          :storage #2A((1d0 2d0)
  87                                       (3d0 4d0))))
  88                  #2A((1d0 2d0)
  89                      (3d0 4d0)))
  90
  91
  92   (defparameter *my-df-1*
  93     (make-dataframe  #2A((1 2 3 4 5)
  94                          (10 20 30 40 50))
  95                      :caselabels (list "x" "y")
  96                      :varlabels (list "a" "b" "c" "d" "e")
  97                      :doc "This is an interesting dataframe-array"))
  98
  99   (caselabels *my-df-1*)
 100   (varlabels *my-df-1*)
 101
 102
 103   (defparameter *my-df-2*
 104         (make-instance 'dataframe-array
 105                        :storage
 106                        (make-array-from-listoflists
 107                         (cybertiggyr-dsv::load-escaped
 108                          "/media/disk/Desktop/sandbox/CLS.git/Data/example-mixed.csv"))
 109                        :doc "This is an interesting dataframe-array"))
 110 #|                     :case-labels (list "x" "y")
 111                        :var-labels (list "a" "b" "c" "d" "e")
 112 |#
 113
 114
 115   )
 116
 117 (progn ;; Data setup
 118
 119   (describe 'make-matrix)
 120
 121   (defparameter *indep-vars-2-matrix*
 122     (make-matrix (length iron) 2
 123                  :initial-contents
 124                  (mapcar #'(lambda (x y)
 125                              (list (coerce x 'double-float)
 126                                    (coerce y 'double-float)))
 127                          iron aluminum)))
 128
 129
 130   (defparameter *dep-var*
 131     (make-vector (length absorbtion)
 132                  :type :row
 133                  :initial-contents
 134                  (list
 135                   (mapcar #'(lambda (x) (coerce x 'double-float))
 136                           absorbtion))))
 137
 138   (make-dataframe *dep-var*)
 139   (make-dataframe (transpose *dep-var*))
 140
 141   (defparameter *dep-var-int*
 142     (make-vector (length absorbtion)
 143                  :type :row
 144                  :element-type 'integer
 145                  :initial-contents (list absorbtion)))
 146
 147
 148   (defparameter *xv+1a*
 149     (make-matrix
 150      8 2
 151      :initial-contents #2A((1d0 1d0)
 152                            (1d0 3d0)
 153                            (1d0 2d0)
 154                            (1d0 4d0)
 155                            (1d0 3d0)
 156                            (1d0 5d0)
 157                            (1d0 4d0)
 158                            (1d0 6d0))))
 159
 160   (defparameter *xv+1b*
 161     (bind2
 162      (ones 8 1)
 163      (make-matrix
 164       8 1
 165       :initial-contents '((1d0)
 166                           (3d0)
 167                           (2d0)
 168                           (4d0)
 169                           (3d0)
 170                           (5d0)
 171                           (4d0)
 172                           (6d0)))
 173      :by :column))
 174
 175   (m= *xv+1a* *xv+1b*) ; => T
 176
 177   (princ "Data Set up"))
 178
 179
 180
 181
 182 (progn
 183   ;; REVIEW: general Lisp use guidance
 184
 185   (fdefinition 'make-matrix)
 186   (documentation 'make-matrix 'function)
 187
 188 #| Examples from CLHS, a bit of guidance.
 189
 190   ;; This function assumes its callers have checked the types of the
 191   ;; arguments, and authorizes the compiler to build in that assumption.
 192   (defun discriminant (a b c)
 193    (declare (number a b c))
 194    "Compute the discriminant for a quadratic equation."
 195    (- (* b b) (* 4 a c))) =>  DISCRIMINANT
 196   (discriminant 1 2/3 -2) =>  76/9
 197
 198   ;; This function assumes its callers have not checked the types of the
 199   ;; arguments, and performs explicit type checks before making any assumptions.
 200  (defun careful-discriminant (a b c)
 201    "Compute the discriminant for a quadratic equation."
 202    (check-type a number)
 203    (check-type b number)
 204    (check-type c number)
 205    (locally (declare (number a b c))
 206      (- (* b b) (* 4 a c)))) =>  CAREFUL-DISCRIMINANT
 207  (careful-discriminant 1 2/3 -2) =>  76/9
 208 |#
 209   )
 210
 211
 212 #+nil
 213 (progn ;; FIXME: Regression modeling
 214
 215   ;; data setup in previous FIXME
 216   (defparameter  *m* nil
 217     "holding variable.")
 218   ;; need to make vectors and matrices from the lists...
 219
 220   ;; BROKEN
 221   (def *m* (regression-model (list->vector-like iron)
 222                              (list->vector-like absorbtion)))
 223
 224   (def m (regression-model (list->vector-like iron)
 225                            (list->vector-like absorbtion) :print nil))
 226                            ;;Good
 227   (send m :print)
 228   (send m :own-slots)
 229   (send m :own-methods)
 230   ;; (lsos::ls-objects-methods m) ; bogus?
 231   (send m :show)
 232
 233   (def m (regression-model (list->vector-like iron)
 234                            (list->vector-like absorbtion)))
 235
 236   (def m (regression-model (listoflists->matrix-like  (list iron aluminum))
 237                            (list->vector-like  absorbtion) :print nil))
 238
 239
 240   (send m :compute)
 241   (send m :sweep-matrix)
 242   (format t "~%~A~%" (send m :sweep-matrix))
 243
 244   ;; need to get multiple-linear regression working (simple linear regr
 245   ;; works)... to do this, we need to redo the whole numeric structure,
 246   ;; I'm keeping these in as example of brokenness...
 247
 248   (send m :basis) ;; this should be positive?
 249   (send m :coef-estimates)  )
 250
 251 #+nil
 252 (progn ;; FIXME: Need to clean up data examples, licenses, attributions, etc.
 253   ;; The following breaks because we should use a package to hold
 254   ;; configuration details, and this would be the only package outside
 255   ;; of packages.lisp, as it holds the overall defsystem structure.
 256   (load-data "iris.lsp")  ;; (the above partially fixed).
 257   (variables)
 258   diabetes )
 259
 260
 261
 262
 263 (progn ;; FIXME: read data from CSV file.  To do.
 264
 265
 266   ;; challenge is to ensure that we get mixed arrays when we want them,
 267   ;; and single-type (simple) arrays in other cases.
 268
 269
 270   (defparameter *csv-num*
 271     (cybertiggyr-dsv::load-escaped
 272      #p"/media/disk/Desktop/sandbox/CLS.git/Data/example-numeric.csv"
 273      :field-separator #\,
 274      :trace T))
 275
 276   (nth 0 (nth 0 *csv-num*))
 277
 278   (defparameter *csv-num*
 279     (cybertiggyr-dsv::load-escaped
 280      #p"/media/disk/Desktop/sandbox/CLS.git/Data/example-numeric2.dsv"
 281      :field-separator #\:))
 282
 283   (nth 0 (nth 0 *csv-num*))
 284
 285
 286   ;; The handling of these types should be compariable to what we do for
 287   ;; matrices, but without the numerical processing.  i.e. mref, bind2,
 288   ;; make-dataframe, and the class structure should be similar.
 289
 290   ;; With numerical data, there should be a straightforward mapping from
 291   ;; the data.frame to a matrix.   With categorical data (including
 292   ;; dense categories such as doc-strings, as well as sparse categories
 293   ;; such as binary data), we need to include metadata about ordering,
 294   ;; coding, and such.  So the structures should probably consider
 295
 296   ;; Using the CSV file:
 297
 298   (defun parse-number (s)
 299     (let* ((*read-eval* nil)
 300            (n (read-from-string s)))
 301       (if (numberp n) n)))
 302
 303   (parse-number "34")
 304   (parse-number "34 ")
 305   (parse-number " 34")
 306   (parse-number " 34 ")
 307
 308   (+  (parse-number "3.4") 3)
 309   (parse-number "3.4 ")
 310   (parse-number " 3.4")
 311   (+  (parse-number " 3.4 ") 3)
 312
 313   (parse-number "a")
 314
 315   ;; (coerce "2.3" 'number)  => ERROR
 316   ;; (coerce "2" 'float)  => ERROR
 317
 318   (defparameter *csv-num*
 319     (cybertiggyr-dsv::load-escaped
 320      #p"/media/disk/Desktop/sandbox/CLS.git/Data/example-numeric.csv"
 321      :field-separator #\,
 322      :filter #'parse-number
 323      :trace T))
 324
 325   (nth 0 (nth 0 *csv-num*))
 326
 327   (defparameter *csv-num*
 328     (cybertiggyr-dsv::load-escaped
 329      #p"/media/disk/Desktop/sandbox/CLS.git/Data/example-numeric2.dsv"
 330      :field-separator #\:
 331      :filter #'parse-number))
 332
 333   (nth 0 (nth 0 *csv-num*))
 334
 335   ;; now we've got the DSV code in the codebase, auto-loaded I hope:
 336   cybertiggyr-dsv:*field-separator*
 337   (defparameter *example-numeric.csv*
 338     (cybertiggyr-dsv:load-escaped "Data/example-numeric.csv"
 339                                   :field-separator #\,))
 340   *example-numeric.csv*
 341
 342   ;; the following fails because we've got a bit of string conversion
 343   ;; to do.   2 thoughts: #1 modify dsv package, but mucking with
 344   ;; encapsulation.  #2 add a coercion tool (better, but potentially
 345   ;; inefficient).
 346   #+nil(coerce  (nth 3 (nth 3 *example-numeric.csv*)) 'double-float)
 347
 348   ;; cases, simple to not so
 349   (defparameter *test-string1* "1.2")
 350   (defparameter *test-string2* " 1.2")
 351   (defparameter *test-string3* " 1.2 ")
 352   )
 353
 354
 355 #+nil
 356 (progn ;; experiments with GSL and the Lisp interface.
 357   (asdf:oos 'asdf:load-op 'gsll)
 358   (asdf:oos 'asdf:load-op 'gsll-tests)
 359
 360   ;; the following should be equivalent
 361   (setf *t1*  (LIST 6.18d0 6.647777777777779d0 6.18d0))
 362   (setf *t2*  (MULTIPLE-VALUE-LIST
 363                (LET ((VEC
 364                       (gsll:make-marray 'DOUBLE-FLOAT
 365                                         :INITIAL-CONTENTS '(-3.21d0 1.0d0 12.8d0)))
 366                      (WEIGHTS
 367                       (gsll:MAKE-MARRAY 'DOUBLE-FLOAT
 368                                         :INITIAL-CONTENTS '(3.0d0 1.0d0 2.0d0))))
 369                  (LET ((MEAN (gsll:MEAN VEC)))
 370                    (LIST (gsll:ABSOLUTE-DEVIATION VEC)
 371                          (gsll:WEIGHTED-ABSOLUTE-DEVIATION VEC WEIGHTS)
 372                          (gsll:ABSOLUTE-DEVIATION VEC MEAN))))))
 373   (eql *t1* *t2*)
 374
 375   ;; from (gsll:examples 'gsll::numerical-integration) ...
 376   (gsll:integration-qng gsll::one-sine 0.0d0 PI)
 377
 378   (gsll:defun-single axpb (x) (+ (* 2 x) 3)) ;; a<-2, b<-3
 379   (gsll:integration-qng axpb 1d0 2d0)
 380
 381   (let ((a 2)
 382         (b 3))
 383     (defun-single axpb2 (x) (+ (* a x) b)))
 384   (gsll:integration-qng axpb2 1d0 2d0)
 385
 386   ;;   BAD
 387   ;;   (gsll:integration-qng
 388   ;;    (let ((a 2)
 389   ;;     (b 3))
 390   ;;      (defun-single axpb2 (x) (+ (* a x) b)))
 391   ;;    1d0 2d0)
 392
 393   ;; right, but weird expansion...
 394   (gsll:integration-qng
 395    (let ((a 2)
 396          (b 3))
 397      (defun axpb2 (x) (+ (* a x) b))
 398      (gsll:def-single-function axpb2)
 399      axpb2)
 400    1d0 2d0)
 401
 402   ;; Linear least squares
 403
 404   (gsll:gsl-lookup "gsl_linalg_LU_decomp") ; => gsll:lu-decomposition
 405   (gsll:gsl-lookup "gsl_linalg_LU_solve") ; => gsll:lu-solve
 406   )
 407
 408
 409
 410 #+nil
 411 (progn ;; philosophy time
 412
 413   (setf my-model (model :name "ex1"
 414                         :data-slots (list w x y z)
 415                         :param-slots (list alpha beta gamma)
 416                         :math-form (regression-model :formula '(= w (+ (* beta x)
 417                                                                      (* alpha y)
 418                                                                      (* gamma z)
 419                                                                      normal-error))
 420                                                      :centrality 'median ; 'mean
 421                                                      )))
 422
 423 #| or:
 424   #R"W ~ x+  y + z "
 425 |#
 426
 427   (setf my-dataset (statistical-table :table data-frame-contents
 428                                       :metadata (list (:case-names (list ))
 429                                                       (:var-names (list ))
 430                                                       (:documentation "string of doc"))))
 431
 432   (setf my-analysis (analysis
 433                      :model my-model
 434                      :data my-dataset
 435                      :parameter-map (pairing (model-param-slots my-model)
 436                                              (data-var-names my-dataset))))
 437
 438   ;; ontological implications -- the analysis is an abstract class of
 439   ;; data, model, and mapping between the model and data.  The fit is
 440   ;; the instantiation of such.  This provides a statistical object
 441   ;; computation theory which can be realized as "executable
 442   ;; statistics" or "computable statistics".
 443   (setf my-analysis (analyze my-fit
 444                              :estimation-method 'linear-least-squares-regression))
 445
 446   ;; one of the tricks here is that one needs to provide the structure
 447   ;; from which to consider estimation, and more importantly, the
 448   ;; validity of the estimation.
 449
 450   ;;
 451   (setf linear-least-squares-regression
 452         (estimation-method-definition
 453          :variable-defintions ((list
 454                                 ;; from MachLearn: supervised,
 455                                 ;; unsupervised
 456                                 :data-response-vars list-drv ; nil if unsup
 457                                 ;;
 458                                 :param-vars list-pv
 459                                      :data-predictor-vars list-dpv
 460                                      ;; nil in this case.  these
 461                                      ;; describe "out-of-box" specs
 462                                      :hyper-vars list-hv))
 463          :form '(regression-additive-error
 464                  :central-form (linear-form drv pv dpv)
 465                  :error-form 'normal-error)
 466          :resulting-decision '(point-estimation interval-estimation)
 467          :philosophy 'frequentist
 468          :documentation "use least squares to fit a linear regression
 469                          model to data."))
 470
 471   (defparameter *statistical-philosophies*
 472     '(frequentist bayesian fiducial decision-analysis)
 473     "can be combined to build decision-making approaches and
 474     characterizations")
 475
 476   (defparameter *decisions*
 477     '(estimation selection testing)
 478     "possible results from a...")
 479   ;; is this really true?  One can embedded hypothesis testing within
 480   ;; estimation, as the hypothesis estimated to select.  And
 481   ;; categorical/continuous rear their ugly heads, but not really in
 482   ;; an essential way.
 483
 484   (defparameter *ontology-of-decision-procedures*
 485     (list :decisions
 486           (list :estimation
 487                 (list :point
 488                       (list :maximum-likelihood
 489                             :minimum-entropy
 490                             :least-squares
 491                             :method-of-moments)
 492                       :interval
 493                       (list :maximum-likelihood
 494                             :))
 495                 :testing
 496                 (list :fisherian
 497                       :neyman-pearson
 498                       (list :traditional
 499                             :bioequivalence-inversion)
 500                       :selection
 501                       (list :ranking
 502                             :top-k-of-n-select))
 503                 :parametric
 504                 :partially-parametric))
 505     "start of ontology"))
 506
 507
 508 ;;;; LM
 509
 510 (progn
 511
 512   (defparameter *y*
 513     (make-vector
 514      8
 515      :type :row
 516      :initial-contents '((1d0 2d0 3d0 4d0 5d0 6d0 7d0 8d0))))
 517
 518
 519   (defparameter *xv+1*
 520     (make-matrix
 521      8 2
 522      :initial-contents '((1d0 1d0)
 523                          (1d0 3d0)
 524                          (1d0 2d0)
 525                          (1d0 4d0)
 526                          (1d0 3d0)
 527                          (1d0 5d0)
 528                          (1d0 4d0)
 529                          (1d0 6d0))))
 530
 531
 532   ;; so something like (NOTE: matrices are transposed to begin with, hence the incongruety)
 533   (defparameter *xtx-2* (m* (transpose *xv+1*) *xv+1*))
 534   ;; #<LA-SIMPLE-MATRIX-DOUBLE  2 x 2
 535   ;;  8.0d0 28.0d0
 536   ;;  28.0d0 116.0d0>
 537
 538   (defparameter *xty-2* (m* (transpose *xv+1*)  (transpose *y*)))
 539   ;; #<LA-SIMPLE-VECTOR-DOUBLE (2 x 1)
 540   ;;  36.0d0
 541   ;;  150.0d0>
 542
 543   (defparameter *rcond-2* 0.000001)
 544   (defparameter *betahat-2*  (gelsy *xtx-2* *xty-2* *rcond-2*))
 545   ;; *xtx-2* => "details of complete orthogonal factorization"
 546   ;; according to man page:
 547   ;; #<LA-SIMPLE-MATRIX-DOUBLE  2 x 2
 548   ;;  -119.33147112141039d0 -29.095426104883202d0
 549   ;;  0.7873402682880205d0 -1.20672274167718d0>
 550
 551   ;; *xty-2* => output becomes solution:
 552   ;; #<LA-SIMPLE-VECTOR-DOUBLE (2 x 1)
 553   ;;  -0.16666666666668312d0
 554   ;;  1.333333333333337d0>
 555
 556   *betahat-2* ; which matches R, see below
 557
 558   (documentation 'gelsy 'function)
 559
 560
 561 ;;   (#<LA-SIMPLE-VECTOR-DOUBLE (2 x 1)
 562 ;;    -0.16666666666668312 1.333333333333337>
 563 ;;    2)
 564
 565 ;;   ## Test case in R:
 566 ;;   x <- c( 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0)
 567 ;;   y <- c( 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0)
 568 ;;   lm(y~x)
 569 ;;   ## => Call:  lm(formula = y ~ x)
 570
 571 ;;   Coefficients:  (Intercept)            x
 572 ;;                      -0.1667       1.3333
 573
 574 ;;   summary(lm(y~x))
 575 ;;   ## =>
 576
 577 ;;   Call:
 578 ;;   lm(formula = y ~ x)
 579
 580 ;;   Residuals:
 581 ;;          Min         1Q     Median         3Q        Max
 582 ;;   -1.833e+00 -6.667e-01 -3.886e-16  6.667e-01  1.833e+00
 583
 584 ;;   Coefficients:
 585 ;;               Estimate Std. Error t value Pr(>|t|)
 586 ;;   (Intercept)  -0.1667     1.1587  -0.144  0.89034
 587 ;;   x             1.3333     0.3043   4.382  0.00466 **
 588 ;;   ---
 589 ;;   Signif. codes:  0 ‘***’ 0.001 ‘**’ 0.01 ‘*’ 0.05 ‘.’ 0.1 ‘ ’ 1
 590
 591 ;;   Residual standard error: 1.291 on 6 degrees of freedom
 592 ;;   Multiple R-squared: 0.7619,        Adjusted R-squared: 0.7222
 593 ;;   F-statistic:  19.2 on 1 and 6 DF,  p-value: 0.004659
 594
 595
 596
 597   ;; which suggests one might do (modulo ensuring correct
 598   ;; orientations).  When this is finalized, it should migrate to
 599   ;; CLS.
 600   ;;
 601
 602
 603   (defparameter *n* 20) ; # rows = # obsns
 604   (defparameter *p* 10) ; # cols = # vars
 605   (defparameter *x-temp*  (rand *n* *p*))
 606   (defparameter *b-temp*  (rand *p* 1))
 607   (defparameter *y-temp*  (m* *x-temp* *b-temp*))
 608   ;; so Y=Xb + \eps
 609   (defparameter *rcond* (* (coerce (expt 2 -52) 'double-float)
 610                    (max (nrows *x-temp*) (ncols *y-temp*))))
 611   (defparameter *orig-x* (copy *x-temp*))
 612   (defparameter *orig-b* (copy *b-temp*))
 613   (defparameter *orig-y* (copy *y-temp*))
 614
 615   (defparameter *lm-result* (lm *x-temp* *y-temp*))
 616   (princ (first *lm-result*))
 617   (princ (second *lm-result*))
 618   (princ (third *lm-result*))
 619   (v= (third *lm-result*)
 620       (v- (first (first *lm-result*))
 621           (first  (second *lm-result*))))
 622
 623
 624
 625
 626   ;; Some issues exist in the LAPACK vs. LINPACK variants, hence R
 627   ;; uses LINPACK primarily, rather than LAPACK.  See comments in R
 628   ;; source for issues.
 629
 630
 631   ;; Goal is to start from X, Y and then realize that if
 632   ;; Y = X \beta, then,   i.e. 8x1 = 8xp px1  + 8x1
 633   ;;      XtX \hat\beta = Xt Y
 634   ;; so that we can solve the equation  W \beta = Z   where W and Z
 635   ;; are known, to estimate \beta.
 636
 637   ;; the above is known to be numerically instable -- some processing
 638   ;; of X is preferred and should be done prior.  And most of the
 639   ;; transformation-based work does precisely that.
 640
 641   ;; recall:  Var[Y] = E[(Y - E[Y])(Y-E[Y])t]
 642   ;;   = E[Y Yt] - 2 \mu \mut + \mu \mut
 643   ;;   = E[Y Yt] - \mu \mut
 644
 645   ;; Var Y = E[Y^2] - \mu^2
 646
 647
 648   ;; For initial estimates of covariance of \hat\beta:
 649
 650   ;; \hat\beta = (Xt X)^-1 Xt Y
 651   ;; with E[ \hat\beta ]
 652   ;;        = E[ (Xt X)^-1 Xt Y ]
 653   ;;        = E[(Xt X)^-1 Xt (X\beta)]
 654   ;;        = \beta
 655   ;;
 656   ;; So Var[\hat\beta] = ...
 657   ;;     (Xt X)
 658   ;; and this gives SE(\beta_i) = (* (sqrt (mref Var i i)) adjustment)
 659
 660
 661   ;; from docs:
 662
 663   (setf *temp-result*
 664         (let ((*default-implementation* :foreign-array))
 665           (let* ((m 10)
 666                  (n 10)
 667                  (a (rand m n))
 668                  (x (rand n 1))
 669                  (b (m* a x))
 670                  (rcond (* (coerce (expt 2 -52) 'double-float)
 671                            (max (nrows a) (ncols a))))
 672                  (orig-a (copy a))
 673                  (orig-b (copy b))
 674                  (orig-x (copy x)))
 675             (list x (gelsy a b rcond))
 676             ;; no applicable conversion?
 677             ;; (m-   (#<FA-SIMPLE-VECTOR-DOUBLE (10 x 1))
 678             ;;       (#<FA-SIMPLE-VECTOR-DOUBLE (10 x 1)) )
 679             (v- x (first (gelsy a b rcond))))))
 680
 681
 682   (princ *temp-result*)
 683
 684   (setf *temp-result*
 685         (let ((*default-implementation* :lisp-array))
 686           (let* ((m 10)
 687                  (n 10)
 688                  (a (rand m n))
 689                  (x (rand n 1))
 690                  (b (m* a x))
 691                  (rcond (* (coerce (expt 2 -52) 'double-float)
 692                            (max (nrows a) (ncols a))))
 693                  (orig-a (copy a))
 694                  (orig-b (copy b))
 695                  (orig-x (copy x)))
 696             (list x (gelsy a b rcond))
 697             (m- x (first  (gelsy a b rcond)))
 698             )))
 699   (princ *temp-result*)
 700
 701
 702   (defparameter *xv*
 703     (make-vector
 704      8
 705      :type :row ;; default, not usually needed!
 706      :initial-contents '((1d0 3d0 2d0 4d0 3d0 5d0 4d0 6d0))))
 707
 708   (defparameter *y*
 709     (make-vector
 710      8
 711      :type :row
 712      :initial-contents '((1d0 2d0 3d0 4d0 5d0 6d0 7d0 8d0))))
 713
 714   ;; so something like (NOTE: matrices are transposed to begin with, hence the incongruety)
 715   (defparameter *xtx-1* (m* *xv* (transpose *xv*)))
 716   (defparameter *xty-1* (m* *xv* (transpose  *y*)))
 717   (defparameter *rcond-in* (* (coerce (expt 2 -52) 'double-float)
 718                               (max (nrows *xtx-1*)
 719                                    (ncols *xty-1*))))
 720
 721   (defparameter *betahat*  (gelsy *xtx-1* *xty-1* *rcond-in*))
 722
 723   ;;  (#<LA-SIMPLE-VECTOR-DOUBLE (1 x 1)
 724   ;;  1.293103448275862>
 725   ;;  1)
 726
 727   ;;   ## Test case in R:
 728   ;;   x <- c( 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0)
 729   ;;   y <- c( 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 8.0)
 730   ;;   lm(y~x-1)
 731   ;;   ## =>
 732   ;;   Call:
 733   ;;   lm(formula = y ~ x - 1)
 734
 735   ;;   Coefficients:
 736   ;;       x
 737   ;;   1.293
 738
 739   (first  *betahat*))
 740
 741
 742
 743 #+nil
 744 (progn
 745
 746   (asdf:oos 'asdf:load-op 'cl-plplot)
 747
 748   (plot-ex))
 749
 750 #|
 751
 752   (type-of #2A((1 2 3 4 5)
 753                        (10 20 30 40 50)))
 754
 755   (type-of (rand 10 20))
 756
 757   (typep #2A((1 2 3 4 5)
 758              (10 20 30 40 50))
 759          'matrix-like)
 760
 761   (typep (rand 10 20) 'matrix-like)
 762
 763   (typep #2A((1 2 3 4 5)
 764              (10 20 30 40 50))
 765          'array)
 766
 767   (typep (rand 10 20) 'array)
 768
 769 |#