-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathcontext.py
More file actions
27 lines (22 loc) · 1.18 KB
/
context.py
File metadata and controls
27 lines (22 loc) · 1.18 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
from pyspark.sql import SparkSession
from pyspark import SparkConf
def get_local_spark_context() -> SparkSession:
    """Return a local, Hive-enabled SparkSession configured for a mock S3A endpoint.

    The session runs on the ``local[*]`` master under the application name
    ``"test"``, with the driver bound to ``127.0.0.1:8082`` and 5g of driver
    memory requested. The ``hadoop-aws`` package is requested through
    ``spark.jars.packages`` so that ``s3a://`` paths can be resolved.

    S3A is pointed at ``http://localhost:4566`` with path-style access, SSL
    disabled and placeholder ("mock") temporary credentials.
    NOTE(review): port 4566 is presumably a LocalStack instance -- confirm
    against the test environment setup.

    Despite the function name, the returned object is a ``SparkSession``,
    not a ``SparkContext``. Because ``getOrCreate()`` is used, an already
    active session is returned instead of a new one being built.

    Returns:
        The SparkSession obtained from ``SparkSession.builder``.
    """
    conf = (
        SparkConf()
        # Driver / application settings.
        .setMaster("local[*]")
        .setAppName("test")
        .set("spark.driver.memory", "5g")
        .set("spark.driver.host", "127.0.0.1")
        .set("spark.driver.port", "8082")
        .set("spark.jars.packages", "org.apache.hadoop:hadoop-aws:3.2.2")
        # S3A filesystem settings (each key is set exactly once).
        .set("spark.hadoop.fs.s3a.impl", "org.apache.hadoop.fs.s3a.S3AFileSystem")
        .set("spark.hadoop.fs.s3a.path.style.access", "true")
        .set("spark.hadoop.fs.s3a.connection.ssl.enabled", "false")
        .set(
            "spark.hadoop.fs.s3a.aws.credentials.provider",
            "org.apache.hadoop.fs.s3a.TemporaryAWSCredentialsProvider",
        )
        # Placeholder credentials; the temporary-credentials provider also
        # needs a session token alongside the access/secret key pair.
        .set("spark.hadoop.fs.s3a.access.key", "mock")
        .set("spark.hadoop.fs.s3a.secret.key", "mock")
        .set("spark.hadoop.fs.s3a.session.token", "mock")
        .set("spark.hadoop.fs.s3a.endpoint", "http://localhost:4566")
    )

    session = SparkSession.builder.config(conf=conf).enableHiveSupport().getOrCreate()
    return session