# Session script: start a local Spark session and load a CSV that contains
# missing values, then print its contents.
#
# Reconstructed from an interactive (IPython-style) transcript; the statements
# below are the ones entered at prompts In [1] .. In [6], in the same order.

import findspark

# Point findspark at the local Spark installation. This call is made before
# the pyspark import below, matching the order used in the original session.
# NOTE(review): the path is machine-specific — adjust for your environment.
findspark.init('/home/hak/spark-2.4.5-bin-hadoop2.7/')

from pyspark.sql import SparkSession

# Reuse an existing session if there is one, otherwise create a new one.
spark = SparkSession.builder.appName('MissingData').getOrCreate()

# header=True: take column names from the first row of the file.
# inferSchema=True: let Spark infer column types from the data.
df = spark.read.csv('ContainsNull.csv', header=True, inferSchema=True)

df.show()
# Output captured in the original session (the capture is cut off in the
# source, so only the visible portion is reproduced here, as-is):
#
# +----+-----+-----+
# | Id| Name|Sales|
# +----+-----+-----+
# |emp1| John| nu..