
Commit ee07541

srowen authored and mengxr committed

SPARK-2748 [MLLIB] [GRAPHX] Loss of precision for small arguments to Math.exp, Math.log

In a few places in MLlib, an expression of the form `log(1.0 + p)` is evaluated. When p is so small that `1.0 + p == 1.0`, the result is 0.0, while the correct answer is very near `p`. This is why `Math.log1p` exists. Similarly, one instance of `exp(m) - 1` in GraphX has the analogous remedy `Math.expm1`. Although the errors occur only for very small arguments, such arguments are entirely possible given these expressions' use in machine learning algorithms. Also note the related PR for Python: #1652

Author: Sean Owen <[email protected]>

Closes #1659 from srowen/SPARK-2748 and squashes the following commits:

c5926d4 [Sean Owen] Use log1p, expm1 for better precision for tiny arguments

1 parent 7c5fc28
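
A quick standalone illustration of the claim (plain Scala; `scala.math` forwards to `java.lang.Math`):

    val p = 1e-20
    math.log(1.0 + p) // 0.0: 1.0 + p rounds to exactly 1.0 in double precision
    math.log1p(p)     // ~1.0e-20, very near p as desired
    math.exp(p) - 1   // 0.0, for the same reason
    math.expm1(p)     // ~1.0e-20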

File tree: 2 files changed (+8, −6 lines)


graphx/src/main/scala/org/apache/spark/graphx/util/GraphGenerators.scala

Lines changed: 4 additions & 2 deletions
@@ -100,8 +100,10 @@ object GraphGenerators {
    */
   private def sampleLogNormal(mu: Double, sigma: Double, maxVal: Int): Int = {
     val rand = new Random()
-    val m = math.exp(mu + (sigma * sigma) / 2.0)
-    val s = math.sqrt((math.exp(sigma*sigma) - 1) * math.exp(2*mu + sigma*sigma))
+    val sigmaSq = sigma * sigma
+    val m = math.exp(mu + sigmaSq / 2.0)
+    // expm1 is exp(m)-1 with better accuracy for tiny m
+    val s = math.sqrt(math.expm1(sigmaSq) * math.exp(2*mu + sigmaSq))
     // Z ~ N(0, 1)
     var X: Double = maxVal
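
Here `m` and `s` are the mean and standard deviation of the log-normal distribution. A standalone sketch, separate from the commit, of why expm1 matters when sigma is tiny:

    // With sigma = 1e-9, sigmaSq = 1e-18 is far below machine epsilon (~2.2e-16),
    // so exp(sigmaSq) rounds to exactly 1.0 and the naive standard deviation collapses to 0.
    val mu = 0.0
    val sigma = 1e-9
    val sigmaSq = sigma * sigma
    math.sqrt((math.exp(sigmaSq) - 1) * math.exp(2*mu + sigmaSq)) // 0.0, wrong
    math.sqrt(math.expm1(sigmaSq) * math.exp(2*mu + sigmaSq))     // ~1.0e-9, correct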

mllib/src/main/scala/org/apache/spark/mllib/optimization/Gradient.scala

Lines changed: 4 additions & 4 deletions
@@ -68,9 +68,9 @@ class LogisticGradient extends Gradient {
     val gradient = brzData * gradientMultiplier
     val loss =
       if (label > 0) {
-        math.log(1 + math.exp(margin))
+        math.log1p(math.exp(margin)) // log1p is log(1+p) but more accurate for small p
       } else {
-        math.log(1 + math.exp(margin)) - margin
+        math.log1p(math.exp(margin)) - margin
       }

     (Vectors.fromBreeze(gradient), loss)

@@ -89,9 +89,9 @@ class LogisticGradient extends Gradient {
     brzAxpy(gradientMultiplier, brzData, cumGradient.toBreeze)

     if (label > 0) {
-      math.log(1 + math.exp(margin))
+      math.log1p(math.exp(margin))
     } else {
-      math.log(1 + math.exp(margin)) - margin
+      math.log1p(math.exp(margin)) - margin
     }
   }
 }
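
A standalone illustration, not part of the commit, of the effect on the logistic loss for a strongly negative margin:

    val margin = -40.0
    math.log(1 + math.exp(margin)) // 0.0: exp(-40) ~ 4.25e-18 vanishes in the 1 + p sum
    math.log1p(math.exp(margin))   // ~4.25e-18, the true loss to within rounding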
