fixes to SFileSource

jcanny · jcanny · commit 1ff00a961f8d · 2017-06-13T01:14:48.000-07:00
diff --git a/src/main/scala/BIDMach/Learner.scala b/src/main/scala/BIDMach/Learner.scala
@@ -182,7 +182,8 @@ case class Learner(
           while (paused) Thread.sleep(1000);
           if (updater != null) updater.update(ipass, here, gprogress);
         }
-        val scores = model.evalbatchg(mats, ipass, here);
+        val tmpscores = model.evalbatchg(mats, ipass, here);
+        val scores = if (tmpscores.ncols > 1) mean(tmpscores, 2) else tmpscores;
         if (datasink != null) datasink.put;
         reslist.append(scores.newcopy)
         samplist.append(here)
@@ -312,7 +313,8 @@ case class Learner(
       here += datasource.opts.batchSize
       bytes += mats.map(Learner.numBytes _).reduce(_+_);
       nsamps += mats(0).ncols;
-      val scores = model.evalbatchg(mats, 0, here);
+      val tmpscores = model.evalbatchg(mats, 0, here);
+      val scores = if (tmpscores.ncols > 1) mean(tmpscores,2) else tmpscores;
       if (datasink != null) datasink.put
       reslist.append(scores.newcopy);
       samplist.append(here);
@@ -562,7 +564,20 @@ case class ParLearner(
       Learner.toCPU(models(0).modelmats)
       resetGPUs
     }
-    println("Time=%5.4f secs, gflops=%4.2f, samples=%4.2g, MB/sec=%4.2g" format (gf._2, gf._1, 1.0*opts.nthreads*here, bytes/gf._2/1e6))
+    val perfStr = ("%5.2f%%, score=%6.5f, secs=%3.1f, samps/s=%4.1f, gf=%4.1f, MB/s=%4.1f" format (
+    		           100f*lastp,
+    		           Learner.scoreSummary(reslist, lasti, reslist.length, opts.cumScore),
+    		           gf._2,                          // elapsed seconds (gf._2 was printed as "Time=... secs" before)
+    		           1.0*opts.nthreads*here/gf._2,   // samples processed across all threads, per second
+    		           gf._1,                          // gflops (gf._1 was printed as "gflops=" before)
+    		           bytes/gf._2*1e-6));
+    val gpuStr = if (useGPU) {
+    	             (0 until math.min(opts.nthreads, Mat.hasCUDA)).map((i)=>{
+    	            	 setGPU(i);
+    	            	 if (i==0) (", GPUmem=%3.2f" format GPUmem._1) else (", %3.2f" format GPUmem._1)
+    	             }).mkString;  // join per-GPU fragments; otherwise the log shows "Vector(...)"
+    } else "";
+    myLogger.info(perfStr + gpuStr);
     results = Learner.scores2FMat(reslist) on row(samplist.toList)
   }
 
diff --git a/src/main/scala/BIDMach/datasources/SFileSource.scala b/src/main/scala/BIDMach/datasources/SFileSource.scala
@@ -60,7 +60,7 @@ class SFileSource(override val opts:SFileSource.Opts = new SFileSource.Options)
     val omat = omat0.asInstanceOf[SMat]
     val ioff = Mat.ioneBased
     var idone = done
-    var innz = omat.nnz
+    var onnz = 0;//omat.nnz
     val lims = fcounts
     val nfiles = fcounts.length
     val addConstFeat = opts.addConstFeat
@@ -73,7 +73,7 @@ class SFileSource(override val opts:SFileSource.Opts = new SFileSource.Options)
         val mat = inmat(j).asInstanceOf[SMat];
         var k = mat.jc(icol) - ioff;
         var lastk = mat.jc(icol+1) - ioff;
-        val xoff = innz - k;
+        val xoff = onnz - k;
  //       println("here %d %d %d %d %d" format (k, mat.nrows, mat.ncols, lims.length, j))
         while (k < lastk && mat.ir(k)-ioff < lims(j)) {
           if (xoff + k >= omat.ir.length) {
@@ -89,19 +89,19 @@ class SFileSource(override val opts:SFileSource.Opts = new SFileSource.Options)
           }
           k += 1;
         }
-        innz = xoff + k
+        onnz = xoff + k
         j += 1
       }
       icol += 1
       idone += 1
       if (addConstFeat) {
-        omat.ir(innz) = omat.nrows - 1 + ioff
-        omat.data(innz) = 1
-        innz += 1
+        omat.ir(onnz) = omat.nrows - 1 + ioff
+        omat.data(onnz) = 1
+        onnz += 1
       }
-      omat.jc(idone) = innz + ioff
+      omat.jc(idone) = onnz + ioff
     }
-    omat.nnz0 = innz
+    omat.nnz0 = onnz
     omat    
   }
   
diff --git a/src/main/scala/BIDMach/models/FM.scala b/src/main/scala/BIDMach/models/FM.scala
@@ -196,8 +196,7 @@ class FM(override val opts:FM.Opts = new FM.Options) extends RegressionModel(opt
   }
   
   def meval(in:Mat):FMat = {
-    val targs = targets * in
-    min(targs, 1f, targs)
+  	val targs = if (targets.asInstanceOf[AnyRef] != null) {val targs0 = targets * in; min(targs0, 1f, targs0); targs0} else null
     val alltargs = if (targmap.asInstanceOf[AnyRef] != null) targmap * targs else targs
     val dweights = if (iweight.asInstanceOf[AnyRef] != null) iweight * in else null
     meval3(in, alltargs, dweights)
@@ -208,7 +207,8 @@ class FM(override val opts:FM.Opts = new FM.Options) extends RegressionModel(opt
   // Evaluate the positive/negative factorizations
   
   def meval3(in:Mat, targ:Mat, dweights:Mat):FMat = {
-    val ftarg = full(targ)
+  	val ftarg = if (targ.asInstanceOf[AnyRef] != null) full(targ) else null;
+  	val targs = if (targmap.asInstanceOf[AnyRef] != null && ftarg.asInstanceOf[AnyRef] != null) targmap * ftarg else ftarg;    
     val vt1 = mm1 * in;
     var vt2:Mat = null;
     if (opts.dim2 > 0) {
@@ -229,11 +229,16 @@ class FM(override val opts:FM.Opts = new FM.Options) extends RegressionModel(opt
     }
     GLM.preds(eta, eta, mylinks, totflops);
     if (ogmats != null) ogmats(0) = eta;
-    val v = GLM.llfun(eta, ftarg, mylinks, totflops);
-    if (dweights.asInstanceOf[AnyRef] != null) {
-      FMat(sum(v ∘  dweights, 2) / sum(dweights));
+    
+    if (targs.asInstanceOf[AnyRef] != null) {
+    	val v = GLM.llfun(eta, targs, mylinks, totflops);
+    	if (dweights.asInstanceOf[AnyRef] != null) {
+    		FMat(sum(v ∘  dweights, 2) / sum(dweights));
+    	} else {
+    		FMat(mean(v, 2));
+    	}
     } else {
-      FMat(mean(v, 2));
+      row(0);
     }
   }
   
@@ -322,7 +327,6 @@ object FM {
     val nopts = new PredOptions;
     nopts.batchSize = math.min(10000, mat1.ncols/30 + 1)
     nopts.links = mopts.links.copy;
-    nopts.putBack = 1;
     nopts.dim1 = mopts.dim1;
     nopts.dim2 = mopts.dim2;
     nopts.strictFM = mopts.strictFM;
diff --git a/src/main/scala/BIDMach/models/GLM.scala b/src/main/scala/BIDMach/models/GLM.scala
@@ -906,7 +906,6 @@ object GLM {
     nopts.links = mopts.links
     mopts.links.set(d)
     nopts.batchSize = mopts.batchSize
-    nopts.putBack = 1
     val model = new GLM(mopts)
     val mm = new Learner(
         new MatSource(Array(mat0, targ), mopts), 
@@ -1017,7 +1016,6 @@ object GLM {
     val model = model0.asInstanceOf[GLM]
     val nopts = new PredOptions;
     nopts.batchSize = math.min(10000, mat1.ncols/30 + 1)
-    nopts.putBack = 0
     val newmod = new GLM(nopts);
     newmod.refresh = false
     newmod.copyFrom(model);
@@ -1070,7 +1068,6 @@ object GLM {
     mopts.reg2weight = 1f
     nopts.links = mopts.links
     nopts.batchSize = mopts.batchSize
-    nopts.putBack = 1
     val model = new GLM(mopts)
     val mm = new Learner(
         new MatSource(Array(mat0, targ), mopts), 
@@ -1095,7 +1092,6 @@ object GLM {
     nopts.batchSize = math.min(10000, mat1.ncols/30 + 1)
     if (nopts.links == null) nopts.links = izeros(preds.nrows,1)
     nopts.links.set(3)
-    nopts.putBack = 1
     val nn = new Learner(
         new MatSource(Array(mat1, preds), nopts), 
         model.asInstanceOf[GLM], 
diff --git a/src/main/scala/BIDMach/models/Regression.scala b/src/main/scala/BIDMach/models/Regression.scala
@@ -34,8 +34,10 @@ abstract class RegressionModel(override val opts:RegressionModel.Opts) extends M
       opts.targmap.nrows 
     } else if (opts.targets.asInstanceOf[AnyRef] != null) {
       opts.targets.nrows 
-    } else {
+    } else if (refresh) {
       mats(1).nrows  
+    } else {
+      modelmats(0).nrows;
     }
     val sdat = (sum(data0,2).t + 0.5f).asInstanceOf[FMat]
     sp = sdat / sum(sdat)
diff --git a/src/main/scala/BIDMach/networks/Net.scala b/src/main/scala/BIDMach/networks/Net.scala
@@ -288,9 +288,9 @@ class Net(override val opts:Net.Opts = new Net.Options) extends Model(opts) {
   			}
   			layers(i).forward;
   		}
-  		val scores = zeros(score_layers.length, 1);
+  		val scores = zeros(score_layers.length, batchSize);
   		for (i <- 0 until score_layers.length) {
-  			scores(i) = score_layers(i).score.v;
+  			scores(i,?) = score_layers(i).score;
   		}
   		if (og_layers.asInstanceOf[AnyRef] != null) {
   			for (i <- 0 until og_layers.length) {
diff --git a/src/main/scala/BIDMach/networks/layers/GLMLayer.scala b/src/main/scala/BIDMach/networks/layers/GLMLayer.scala
@@ -47,7 +47,7 @@ class GLMLayer(override val net:Net, override val opts:GLMNodeOpts = new GLMNode
 
 	override def score:FMat = { 
 			val v = if (target.asInstanceOf[AnyRef] != null) GLM.llfun(output, target, ilinks, totflops) else row(0);
-			FMat(mean(mean(v, 2)));
+			FMat(mean(v));
 	}
 	
 	override def clear = {
diff --git a/src/main/scala/BIDMach/networks/layers/Layer.scala b/src/main/scala/BIDMach/networks/layers/Layer.scala
@@ -535,11 +535,10 @@ object Layer {
 
   def softmax(a:LayerTerm) = new SoftmaxLayer(null){inputs(0) = a};
   
-  def softmaxout(a:LayerTerm)(scoreType:Int=0, doVariance:Boolean=false, lossType:Int = 0, net:Net=null) =  {
+  def softmaxout(a:LayerTerm)(scoreType:Int=0, lossType:Int = 0, net:Net=null) =  {
     val scoreTyp = scoreType;
     val lossTyp = lossType;
-    val doVar = doVariance;
-    new SoftmaxOutputLayer(net, new SoftmaxOutputNode{scoreType=scoreTyp; doVariance=doVar; lossType=lossTyp}){inputs(0) = a}
+    new SoftmaxOutputLayer(net, new SoftmaxOutputNode{scoreType=scoreTyp; lossType=lossTyp}){inputs(0) = a}
   }
   
   def softplus(a:LayerTerm) = new SoftplusLayer(null){inputs(0) = a};
diff --git a/src/main/scala/BIDMach/networks/layers/NegsampOutputLayer.scala b/src/main/scala/BIDMach/networks/layers/NegsampOutputLayer.scala
@@ -129,8 +129,8 @@ class NegsampOutputLayer(override val net:Net, override val opts:NegsampOutputNo
       if (coloffsets.asInstanceOf[AnyRef] == null) coloffsets = int(convertMat(irow(0->mprod.ncols)*mprod.nrows));
       val inds = int(target) + coloffsets;
       opts.scoreType match {
-        case 2 => FMat(mean(ln(mprod(inds))));
-        case 3 => FMat(mean(mprod(inds) == maxi(mprod)));        
+        case 2 => FMat(ln(mprod(inds)));
+        case 3 => FMat(mprod(inds) == maxi(mprod));        
       }
     }
   }
diff --git a/src/main/scala/BIDMach/networks/layers/Node.scala b/src/main/scala/BIDMach/networks/layers/Node.scala
@@ -343,10 +343,10 @@ object Node {
 
   def softmax(a:NodeTerm) = new SoftmaxNode{inputs(0) = a};
   
-  def softmaxout(a:NodeTerm)(scoreType:Int=0, doVar:Boolean=false, lossType:Int=0) =  {
+  def softmaxout(a:NodeTerm)(scoreType:Int=0, lossType:Int=0) =  {
     val scoreTyp = scoreType;
     val lossTyp = lossType;
-    new SoftmaxOutputNode{inputs(0) = a; scoreType=scoreTyp; doVariance = doVar; lossType = lossTyp}
+    new SoftmaxOutputNode{inputs(0) = a; scoreType=scoreTyp; lossType = lossTyp}
   }
   
   def softplus(a:NodeTerm) = new SoftplusNode{inputs(0) = a};
diff --git a/src/main/scala/BIDMach/networks/layers/SoftmaxOutputLayer.scala b/src/main/scala/BIDMach/networks/layers/SoftmaxOutputLayer.scala
@@ -79,19 +79,9 @@ class SoftmaxOutputLayer(override val net:Net, override val opts:SoftmaxOutputNo
     if (coloffsets.asInstanceOf[AnyRef] == null) coloffsets = int(convertMat(irow(0->output.ncols)*output.nrows));
     val inds = int(target) + coloffsets;
     if (opts.scoreType == SoftmaxOutputLayer.AccuracyScore) {
-      if (opts.doVariance) {
-        val matches = (output(inds) == maxi(output));
-        FMat(mean(matches)) on FMat(variance(matches));
-      } else {
-      	FMat(mean(output(inds) == maxi(output)));
-      }
+    	FMat(output(inds) == maxi(output));
     } else {
-    	if (opts.doVariance) {
-    	  val out = ln(output(inds));
-    	  FMat(mean(out)) on FMat(variance(out));
-    	} else {
-    		FMat(mean(ln(output(inds))));   
-    	}
+    	FMat(ln(output(inds)));
     }
   }
   
@@ -110,15 +100,13 @@ class SoftmaxOutputLayer(override val net:Net, override val opts:SoftmaxOutputNo
 
 trait SoftmaxOutputNodeOpts extends NodeOpts {
 	var scoreType = 0;
-	var doVariance = false;
 	var lossType = 0;
 	var eps = 1e-5f;
 		
 	def copyOpts(opts:SoftmaxOutputNodeOpts):SoftmaxOutputNodeOpts = {
 			super.copyOpts(opts);
 			opts.scoreType = scoreType;
 			opts.lossType = lossType;
-			opts.doVariance = doVariance;
 			opts.eps = eps;
 			opts;
 	}

Original file line number	Diff line number	Diff line change
`@@ -288,9 +288,9 @@ class Net(override val opts:Net.Opts = new Net.Options) extends Model(opts) {`
`288`	`288`	`}`
`289`	`289`	`layers(i).forward;`
`290`	`290`	`}`
`291`		`- val scores = zeros(score_layers.length, 1);`
	`291`	`+ val scores = zeros(score_layers.length, batchSize);`
`292`	`292`	`for (i <- 0 until score_layers.length) {`
`293`		`- scores(i) = score_layers(i).score.v;`
	`293`	`+ scores(i,?) = score_layers(i).score;`
`294`	`294`	`}`
`295`	`295`	`if (og_layers.asInstanceOf[AnyRef] != null) {`
`296`	`296`	`for (i <- 0 until og_layers.length) {`
Original file line number	Diff line number	Diff line change
`@@ -47,7 +47,7 @@ class GLMLayer(override val net:Net, override val opts:GLMNodeOpts = new GLMNode`
`47`	`47`
`48`	`48`	`override def score:FMat = {`
`49`	`49`	`val v = if (target.asInstanceOf[AnyRef] != null) GLM.llfun(output, target, ilinks, totflops) else row(0);`
`50`		`- FMat(mean(mean(v, 2)));`
	`50`	`+ FMat(mean(v));`
`51`	`51`	`}`
`52`	`52`
`53`	`53`	`override def clear = {`
Original file line number	Diff line number	Diff line change
`@@ -129,8 +129,8 @@ class NegsampOutputLayer(override val net:Net, override val opts:NegsampOutputNo`
`129`	`129`	`if (coloffsets.asInstanceOf[AnyRef] == null) coloffsets = int(convertMat(irow(0->mprod.ncols)*mprod.nrows));`
`130`	`130`	`val inds = int(target) + coloffsets;`
`131`	`131`	`opts.scoreType match {`
`132`		`- case 2 => FMat(mean(ln(mprod(inds))));`
`133`		`- case 3 => FMat(mean(mprod(inds) == maxi(mprod)));`
	`132`	`+ case 2 => FMat(ln(mprod(inds)));`
	`133`	`+ case 3 => FMat(mprod(inds) == maxi(mprod));`
`134`	`134`	`}`
`135`	`135`	`}`
`136`	`136`	`}`