Skip to content

Commit

Permalink
compute on extract_and_upload
Browse files Browse the repository at this point in the history
  • Loading branch information
davedavemckay committed Feb 4, 2025
1 parent 8cafd61 commit 8fd18c6
Showing 1 changed file with 1 addition and 2 deletions.
3 changes: 1 addition & 2 deletions scripts/process_collated_zips.py
Original file line number Diff line number Diff line change
Expand Up @@ -301,9 +301,8 @@ def error(self, message):
  client.scatter(keys_series)
  keys_df['extract'] = keys_df.apply(verify_zip_contents, meta=('extract', 'bool'), keys_series=keys_series, axis=1)
  del keys_series
- keys_df['extracted and uploaded'] = keys_df.apply(extract_and_upload, conn=conn, bucket_name=bucket_name, meta=('extracted and uploaded', 'bool'), axis=1)
  dprint('Zip files extracted and uploaded:')
- dprint(keys_df[keys_df['extracted and uploaded'] == True]['key'].compute())
+ keys_df['extracted and uploaded'] = keys_df.apply(extract_and_upload, conn=conn, bucket_name=bucket_name, meta=('extracted and uploaded', 'bool'), axis=1).compute()
  rm_parquet(pq3)
  dprint('Done.')

Expand Down

0 comments on commit 8fd18c6

Please sign in to comment.