Skip to content

Commit

Permalink
Update medium-stats-spark-driver.py
Browse files (browse the repository at this point in the history)
  • Loading branch information
pavan-kumar-99 authored Jun 12, 2024
1 parent 6ab67d7 commit 7dba05b
Showing 1 changed file with 2 additions and 6 deletions.
8 changes: 2 additions & 6 deletions scripts/medium/medium-stats-spark-driver.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -78,13 +78,9 @@ def process_data(bucket_name, bucket_prefix, local_path):
"hadoop",
)
.config(f"spark.sql.defaultCatalog", f"{catalog_name}")
- .config(
- f"spark.sql.catalog.{catalog_name}.s3.endpoint",
- "http://minio-server.minio:9000",
- )
.config(
f"spark.sql.catalog.{catalog_name}.s3a.endpoint",
- "http://minio-server.minio:9000",
+ "http://minio-server.minio:9000/",
)
.config(
"spark.sql.extensions",
Expand Down Expand Up @@ -208,7 +204,7 @@ def compute_yearly_statistics(spark, table_name):
local_path = "/usr/stats/" + args.key
bucket_name = "medium-stats"
iceberg_bucket_name = "iceberg-table"
- iceberg_bucket_prefix = "iceberg-tables/"
+ iceberg_bucket_prefix = "warehouse/"
temp_table_name = "mediumstatstemp"

download_from_s3(bucket_name, args.key, local_path)
Expand Down

0 comments on commit 7dba05b

Please sign in to comment.