seed = 10
sampleby = 'colA'
fraction=0.8
franctions = df.select(sampleby).distinct().withColumn('fraction', lit(fraction)).rdd.collec
seed = 10
sampleby = 'colA'
fraction=0.8
franctions = df.select(sampleby).distinct().withColumn('fraction', lit(fraction)).rdd.collec