This is an automated email from the ASF dual-hosted git repository. potiuk pushed a commit to branch main in repository https://gitbox.apache.org/repos/asf/airflow-site-archive.git
The following commit(s) were added to refs/heads/main by this push:
     new c505a11a15 Fix remote-path calculation for selective s3->GH sync
c505a11a15 is described below

commit c505a11a150810e49421d38e6302df0137ef7d12
Author: Jarek Potiuk <ja...@potiuk.com>
AuthorDate: Sun May 11 12:41:32 2025 +0200

    Fix remote-path calculation for selective s3->GH sync
---
 scripts/s3_to_github.py | 15 +++++++++------
 1 file changed, 9 insertions(+), 6 deletions(-)

diff --git a/scripts/s3_to_github.py b/scripts/s3_to_github.py
index 738586a3aa..74f99d9f99 100644
--- a/scripts/s3_to_github.py
+++ b/scripts/s3_to_github.py
@@ -47,14 +47,17 @@ class S3TOGithub(CommonTransferUtils):
         )
         return response["KeyCount"] > 0
 
-    def sync_to_s3(self, processes: int, folders: list[str] | None = None):
+    def sync_s3_to_github(self, processes: int, folders: list[str] | None = None,
+                          remote_prefix: str = "docs/"):
         console.print("[blue] Syncing files from S3 to GitHub...[/]")
-        prefixes = self.get_list_of_folders() if not folders else folders
+        prefixes = self.get_list_of_folders() if not folders else [
+            f"{remote_prefix}{folder}" for folder in folders
+        ]
         pool_args = []
         for pref in prefixes:
             source_bucket_path = f"s3://{self.bucket_name}/{pref}"
-            # we want to store the files in the github under docs-archive/
-            destination = self.local_path + pref.replace("docs/", "")
+            # we want to store the files in the github under local_path
+            destination = self.local_path + pref.replace(remote_prefix, "")
             pool_args.append((source_bucket_path, destination))
 
         self.run_with_pool(self.sync, pool_args, processes=processes)
@@ -90,9 +93,9 @@ if __name__ == "__main__":
             sys.exit(1)
         folders_to_sync = sort_priority_folders(folders_to_sync)
-        syncer.sync_to_s3(processes=int(args.processes), folders=folders_to_sync)
+        syncer.sync_s3_to_github(processes=int(args.processes), folders=folders_to_sync)
     else:
-        syncer.sync_to_s3(processes=int(args.processes))
+        syncer.sync_s3_to_github(processes=int(args.processes))