//::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::
/** @author  John Miller
 *  @version 1.6
 *  @date    Sat Jan  9 21:48:57 EST 2016
 *  @see     LICENSE (MIT style license file).
 *
 *  @title   Model: Linear Discriminant Analysis (LDA) Classifier
 *
 *  FIX - extend the code to work for k > 2.
 */

package scalation.analytics
package classifier

import scala.math.log

import scalation.linalgebra.{MatriD, MatrixD, VectoD, VectorD, VectoI, VectorI}
import scalation.plot.Plot
import scalation.util.banner

//::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::
/** The `LDA` class implements a Linear Discriminant Analysis 'LDA' classifier.
 *  It places a vector into a group according to its maximal discriminant function.
 *  For class 'c' the discriminant function evaluated at vector 'z' is
 *      f_c(z) = (S^-1 mu_c) dot z - 0.5 * (S^-1 mu_c) dot mu_c + log (p_c)
 *  where 'S' is the pooled covariance matrix, 'mu_c' the class mean and 'p_c' the
 *  class prior probability.  The parts that do not depend on 'z' are computed once
 *  in 'train' and reused by every call to 'classify'.
 *  FIX - currently only works when the number of classes 'k' = 2.
 *  @see en.wikipedia.org/wiki/Linear_discriminant_analysis
 *  @param x       the real-valued training/test data vectors stored as rows of a matrix
 *  @param y       the training/test classification vector, where y_i = class for row i of the matrix x
 *  @param fn_     the names for all features/variables
 *  @param k       the number of classes (class values are in {0, 1, ... k-1})
 *  @param cn_     the names for all classes
 *  @param hparam  the hyper-parameters
 */
class LDA (x: MatriD, y: VectoI, fn_ : Strings = null, k: Int = 2, cn_ : Strings = null,
           hparam: HyperParameter = null)
      extends ClassifierReal (x, y, fn_, k, cn_, hparam)
{
    private val DEBUG = false                                                      // debug flag

    // report the unsupported configuration before any data processing takes place
    if (k != 2) flaw ("constructor", "k must equal 2 in current implementation")

    // rows of x grouped by class label; the result of the factory call is transposed
    // (presumably because the factory stores the given vectors as columns - confirm)
    private val x1 = (MatrixD (for (i <- x.range1 if y(i) == 0) yield x(i))).t     // rows of class 0
    private val x2 = (MatrixD (for (i <- x.range1 if y(i) == 1) yield x(i))).t     // rows of class 1

    if (DEBUG) {
        banner ("grouped matrices")
        println ("x1 = " + x1)
        println ("x2 = " + x2)
//      new Plot (x1.col(0), x1.col(1), null, "matrix x1")
//      new Plot (x2.col(0), x2.col(1), null, "matrix x2")
    } // if

    private val mu  = (x1.mean, x2.mean, x.mean)                   // means: class 0, class 1, all data
    private val xc0 = x1 - mu._3                                   // class 0 rows minus the global mean
    private val xc1 = x2 - mu._3                                   // class 1 rows minus the global mean

    private var pcovar: MatriD  = null                             // pooled covariance matrix
    private var ipcovar: MatriD = null                             // inverse of pooled covariance matrix
    private var prior: VectoD   = null                             // prior probabilities

    // quantities cached by 'train' so that 'classify' does not recompute them per call
    private var fvec: (VectoD, VectoD)     = null                  // ipcovar * mu_c for each class (null until trained)
    private var halfQ: (Double, Double)    = (0.0, 0.0)            // 0.5 * (fvec_c dot mu_c) for each class
    private var logPrior: (Double, Double) = (0.0, 0.0)            // log (prior_c) for each class

    if (DEBUG) {
        banner ("corrected grouped matrices")
        println ("xc0   = " + xc0)
        println ("xc1   = " + xc1)
        banner ("their mean vectors and covariance matrices")
        println ("mu    = " + mu)
    } // if

    //::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::
    /** Compute the corrected covariance matrix '(xc.t * xc) / m', where 'm' is
     *  the number of rows in 'xc'.
     *  @param xc  the corrected matrix whose corrected covariance matrix is sought
     */
    def corrected_cov (xc: MatriD): MatriD = (xc.t * xc) / xc.dim1

    //::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::
    /** Train the classifier by computing 'pcovar', 'ipcovar' and 'prior'
     *  that are needed to compute the discriminant functions 'f', together with
     *  the per-class terms of 'f' that do not depend on the vector being classified.
     *  The discriminant functions themselves are evaluated in the 'classify' method.
     *  Returns this trained classifier.
     *  @param itest  the indices of the test data - FIX - not used yet
     */
    def train (itest: VectorI): LDA =
    {
        val w1    = x1.dim1 / x.dim1.toDouble                      // first weight (fraction of rows in class 0)
        val w2    = 1.0 - w1                                       // second weight
        val covar = (corrected_cov (xc0), corrected_cov (xc1))     // corrected covariances
        prior     = VectorD (w1, w2)                               // prior probabilities
        pcovar    = covar._1 * w1 + covar._2 * w2                  // pooled covariance matrix
        ipcovar   = pcovar.inverse                                 // inverse of pooled covariance matrix

        val c0    = ipcovar * mu._1                                // coefficient vector for class 0
        val c1    = ipcovar * mu._2                                // coefficient vector for class 1
        fvec      = (c0, c1)
        halfQ     = (0.5 * (c0 dot mu._1), 0.5 * (c1 dot mu._2))
        logPrior  = (log (prior(0)), log (prior(1)))

        if (DEBUG) {
            banner ("pooled covariance and it inverse")
            println ("covar   = " + covar)
            println ("pcovar  = " + pcovar)
            println ("ipcovar = " + ipcovar)
            println ("prior   = " + prior)
        } // if
        this
    } // train

    //::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::
    /** Return the vector of model parameters.
     *  Currently returns null.
     */
    def parameter: VectoD = null                                    // FIX - to be implemented

    //::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::
    /** Classify vector 'z' by computing its discriminant function 'f' for each
     *  group and return the group index with the maximum value for 'f'.
     *  The result is the triple (class index, class name, class index as a Double);
     *  class 1 is returned when the two discriminant values are equal.
     *  Throws `IllegalStateException` if called before 'train'.
     *  @param z  the vector to classify
     */
    override def classify (z: VectoD): (Int, String, Double) =
    {
        if (fvec == null)
            throw new IllegalStateException ("LDA.classify: the classifier must be trained before classifying")

        // same evaluation order as (fvec dot z) - 0.5 * (fvec dot mu) + log (prior)
        val f = ((fvec._1 dot z) - halfQ._1 + logPrior._1,
                 (fvec._2 dot z) - halfQ._2 + logPrior._2)
        if (DEBUG) println ("f = " + f)
        if (f._1 > f._2) (0, cn(0), 0.0) else (1, cn(1), 1.0)
    } // classify

    //::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::
    /** Reset method not applicable.
     */
    def reset (): Unit = { /* Not Applicable */ }

} // LDA class


//::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::::
/** The `LDATest` object is used to test the `LDA` class on a small data set with
 *  two features and two classes: it trains the classifier, classifies every row of
 *  the data matrix, reports the results, classifies one additional vector and
 *  plots the actual versus predicted classes.
 *  @see people.revoledu.com/kardi/tutorial/LDA/Numerical%20Example.html
 *  > runMain scalation.analytics.classifier.LDATest
 */
object LDATest extends App
{
    val fn = Array ("curvature", "diameter")                   // feature names (column order of x)
    val cn = Array ("pass", "fail")                            // class names (index = class value)

    // data matrix: one row per instance, columns = (curvature, diameter)
    val x = new MatrixD ((7, 2),
                         2.95, 6.63,
                         2.53, 7.79,
                         3.57, 5.65,
                         3.16, 5.47,
                         2.58, 4.46,
                         2.16, 6.22,
                         3.27, 3.52)

    // class value for each row of x
    val y = VectorI (0, 0, 0, 0, 1, 1, 1)

    // build and train the classifier, then classify all of the rows of x
    val lda = new LDA (x, y, fn_ = fn, k = 2, cn_ = cn)
    lda.train ()
    val yp = lda.classify (x)
    lda.confusion (yp)                                         // confusion matrix and QoF measures

    banner ("LDA Results")
    lda.contrast (yp)
    println (lda.report)
    println (lda.summary (lda.parameter))

    // classify a single additional vector
    banner ("classify")
    val z  = VectorD (2.81, 5.46)
    println ("classify (" + z + ") = " + lda.classify (z))

    // plot actual (y) and predicted (yp) classes against the row index and each feature
    val t = VectorD.range (0, x.dim1)
    List ((t, "t"), (x.col(0), "x1"), (x.col(1), "x2")).foreach { case (horizontal, label) =>
        new Plot (horizontal, y.toDouble, yp.toDouble, "y(black)/yp(red) vs. " + label)
    } // foreach

} // LDATest object