Skip to content

Commit

Permalink
change source bucket for the Spark data lake example (#706)
Browse files Browse the repository at this point in the history
  • Loading branch information
vgkowski committed Aug 5, 2024
1 parent 57fff96 commit 45f0c8b
Showing 1 changed file with 3 additions and 3 deletions.
6 changes: 3 additions & 3 deletions examples/spark-data-lake/infra/stacks/application_stack.py
Original file line number Diff line number Diff line change
Expand Up @@ -37,14 +37,14 @@ def __init__(
)

# Import the S3 bucket used as the Spark job source
source_bucket = s3.Bucket.from_bucket_name(self, 'SourceBucket', 'nyc-tlc')
source_bucket = s3.Bucket.from_bucket_name(self, 'SourceBucket', 'redshift-demos')

# Copy the Yellow taxi data in the silver bucket of the data lake
dsf.utils.S3DataCopy(
self,
"YellowDataCopy",
source_bucket=source_bucket,
source_bucket_prefix="trip data/yellow_tripdata_2019",
source_bucket_prefix="data/NY-Pub/year=2016/month=1/type=yellow",
source_bucket_region="us-east-1",
target_bucket= storage.silver_bucket,
target_bucket_prefix="yellow-trip-data/",
Expand All @@ -56,7 +56,7 @@ def __init__(
self,
"GreenDataCopy",
source_bucket=source_bucket,
source_bucket_prefix="trip data/green_tripdata_2019",
source_bucket_prefix="data/NY-Pub/year=2016/month=1/type=green",
source_bucket_region="us-east-1",
target_bucket= storage.silver_bucket,
target_bucket_prefix="green-trip-data/",
Expand Down

0 comments on commit 45f0c8b

Please sign in to comment.