>>> df = session.create_dataframe([[1, 2], [1, 2], [3, None], [2, 3], [3, None], [4, None]], schema=["a", "b"])
>>> df.select(count_distinct(col("a"), col("b")).alias("result")).show()
------------
|"RESULT"  |
------------
|2         |
------------
>>> # The result is 2: only the distinct pairs (1, 2) and (2, 3) are counted. The duplicate (1, 2) row counts once, and rows with a NULL in any column, (3, None) and (4, None), are ignored.