Init PyTest

This commit is contained in:
Yûki VACHOT 2024-01-05 17:10:52 +01:00
parent c4fdb2860c
commit 25c2e6b7cb
8 changed files with 100 additions and 44 deletions

48
init.py
View file

@ -1,34 +1,6 @@
import os
import findspark
from pyspark.sql import SparkSession
import pyspark.sql.functions as F
# Module-level demo: these statements are not inside any function, so they
# execute as soon as the module is loaded.
# NOTE(review): the session is created here before init_env() has had a chance
# to set SPARK_HOME / HADOOP_HOME -- confirm that ordering is intended.
spark = SparkSession.builder.master("local[*]").getOrCreate()
# Sample records; every entry carries a "name" and an "age" key.
sample_data = [
{"name": "John D.", "age": 30},
{"name": "Alice G.", "age": 25},
{"name": "Bob T.", "age": 35},
{"name": "Eve A.", "age": 28}
]
df = spark.createDataFrame(sample_data)
# NOTE(review): remove_extra_spaces is neither defined nor imported in the
# visible lines -- confirm where it comes from. Presumably it cleans up
# whitespace in the named column; verify against its definition.
transformed_df = remove_extra_spaces(df, "name")
transformed_df.show()
def main() -> None:
    """Entry point: set up the environment, then print a greeting."""
    # Environment setup comes first so it is done before anything is printed.
    init_env()
    print("hey there")
# Call main() only when this file is run as a script, not when it is imported.
# NOTE(review): in this view the guard appears before `def init_env():`, which
# main() calls -- confirm the definition order in the actual file.
if __name__ == "__main__":
main()
def init_env():
@ -36,4 +8,22 @@ def init_env():
os.environ["SPARK_HOME"] = "C:\\SPARK\\spark-3.1.1-bin-hadoop3.2"
os.environ["HADOOP_HOME"] = "C:\\SPARK\\hadoop"
findspark.init()
findspark.init()
def init_spark():
    """Obtain a local Spark session and display a one-row sample DataFrame.

    The session comes from ``getOrCreate()`` on a builder configured with the
    ``local[*]`` master. A single record with ``name`` and ``age`` fields is
    turned into a DataFrame and printed with ``show()``. Nothing is returned.
    """
    session_builder = SparkSession.builder.master("local[*]")
    session = session_builder.getOrCreate()

    # One hard-coded record is enough to check that the session works.
    sample_rows = [{'name': 'OUI OUI', 'age': 30}]
    sample_frame = session.createDataFrame(sample_rows)
    sample_frame.show()
def main() -> None:
    """Entry point: greet, set up the environment, then start Spark."""
    print("hey there")
    # Environment setup runs before the Spark session is requested.
    init_env()
    init_spark()
# Call main() only when this file is run as a script, not when it is imported.
if __name__ == "__main__":
main()