Search code examples
scalabinary-search-treescalacheck

ScalaCheck generate BST


I'm trying to create a Gen for BST with ScalaCheck, but when I call .sample method it gives me java.lang.NullPointerException. Where do I wrong?

sealed trait Tree

case class Node(left: Tree, right: Tree, v: Int) extends Tree

case object Leaf extends Tree

import org.scalacheck._
import Gen._
import Arbitrary.arbitrary

case class GenerateBST() {

  def genValue(left: Tree, right: Tree): Gen[Int] = (left, right) match {
    case (Node(_, _, min), Node(_, _, max)) => arbitrary[Int].suchThat(x => x > min && x < max)
    case (Node(_, _, min), Leaf) => arbitrary[Int].suchThat(x => x > min)
    case (Leaf, Node(_, _, max)) => arbitrary[Int].suchThat(x => x < max)
    case (Leaf, Leaf) => arbitrary[Int]
  }


  val genNode = for {
    left <- genTree
    right <- genTree
    v <- genValue(left, right)
  } yield Node(left, right, v)

  def genTree: Gen[Tree] = oneOf(const(Leaf), genNode)
}

GenerateBST().genTree.sample

Solution

  • Because of the way you're defining the generator recursively for a recursive data type, you need to use Gen.lzy at the top:

    def genTree: Gen[Tree] = Gen.lzy(oneOf(const(Leaf), genNode))
    

    As an unrelated side note, using suchThat in your generator definitions should generally only be a last resort. It means that sample will often fail (about a third of the time with the fixed version of your code), and more importantly that if you someday want to create arbitrary functions resulting in Tree, you're going to see a lot of horrible org.scalacheck.Gen$RetrievalError: couldn't generate value exceptions.

    In this case you can avoid suchThat pretty easily by using Gen.chooseNum and swapping the left and right sides if they're in the wrong ordered:

    sealed trait Tree
    case class Node(left: Tree, right: Tree, v: Int) extends Tree
    case object Leaf extends Tree
    
    import org.scalacheck.{ Arbitrary, Gen }
    
    object GenerateBST {
      def swapIfNeeded(l: Tree, r: Tree): (Tree, Tree) = (l, r) match {
        // If the two trees don't have space between them, we bump one and recheck:
        case (Node(_, _, x), n @ Node(_, _, y)) if math.abs(x - y) <= 1 =>
          swapIfNeeded(l, n.copy(v = y + 1))
        // If the values are in the wrong order, swap:
        case (Node(_, _, x), Node(_, _, y)) if x > y => (r, l)
        // Otherwise do nothing:
        case (_, _) => (l, r)
      }
    
      def genValue(left: Tree, right: Tree): Gen[Int] = (left, right) match {
        case (Node(_, _, min), Node(_, _, max)) => Gen.chooseNum(min + 1, max - 1)
        case (Node(_, _, min), Leaf) => Gen.chooseNum(min + 1, Int.MaxValue)
        case (Leaf, Node(_, _, max)) => Gen.chooseNum(Int.MinValue, max - 1)
        case (Leaf, Leaf) => Arbitrary.arbitrary[Int]
      }
    
      val genNode = for {
        l0 <- genTree
        r0 <- genTree
        (left, right) = swapIfNeeded(l0, r0)
        v <- genValue(left, right)
      } yield Node(left, right, v)
    
      def genTree: Gen[Tree] = Gen.lzy(Gen.oneOf(Gen.const(Leaf), genNode))
    }
    

    Now you can use Arbitrary[Whatever => Tree] without worrying about generator failures:

    scala> implicit val arbTree: Arbitrary[Tree] = Arbitrary(GenerateBST.genTree)
    arbTree: org.scalacheck.Arbitrary[Tree] = org.scalacheck.ArbitraryLowPriority$$anon$1@606abb0e
    
    scala> val f = Arbitrary.arbitrary[Int => Tree].sample.get
    f: Int => Tree = org.scalacheck.GenArities$$Lambda$7109/289518656@13eefeaf
    
    scala> f(1)
    res0: Tree = Leaf
    
    scala> f(2)
    res1: Tree = Node(Leaf,Leaf,-20313200)
    
    scala> f(3)
    res2: Tree = Leaf
    
    scala> f(4)
    res3: Tree = Node(Node(Leaf,Leaf,-850041807),Leaf,-1)