# Bootstrap a PySpark session from a plain Python interpreter: point the
# process at a local Spark install, make its bundled Python sources and py4j
# archive importable, then expose the `sc` and `sqlCtx` objects provided by
# `pyspark.shell`.
import os
import sys
from glob import glob

# Environment must be in place before `pyspark.shell` is imported below.
# NOTE(review): SPARK_HOME is a machine-specific path and is set
# unconditionally, so any value already present in the environment is
# replaced -- confirm that pinning to this install is intended.
os.environ['SPARK_HOME'] = 'C:\\Users\\MyName\\Documents\\spark-1.4.0-bin-hadoop2.6'
os.environ['SPARK_SCALA_VERSION'] = '2.10'

spark_home = os.environ['SPARK_HOME']

# Spark ships its Python package under <SPARK_HOME>/python.
pyspark_path = os.path.join(spark_home, 'python')
sys.path.insert(0, pyspark_path)

# Every py4j zip found under python/lib is pushed to the front of sys.path,
# so the archives end up ahead of `pyspark_path` in lookup order.
py4j_pattern = os.path.join(pyspark_path, 'lib', 'py4j*.zip')
for z in glob(py4j_pattern):
    sys.path.insert(0, z)

# This import has to come after the sys.path set-up above; it is resolved
# from the Spark install rather than from site-packages.
import pyspark.shell as ps  # noqa: E402

# Re-export the shell's context objects under short module-level names.
sc = ps.sc
sqlCtx = ps.sqlCtx