nextstrain · kimandrews · Feb 5, 2026 · Jan 30, 2026 · Jan 30, 2026 · Jan 30, 2026
diff --git a/README.md b/README.md
@@ -29,9 +29,9 @@ nextstrain build --image ghcr.io/nextstrain/tb:latest .
 By default, AWS S3 caching is **disabled**. All tb-profiler and snippy analyses run locally without uploading or downloading results from S3.
 
 #### To enable AWS S3 caching:
-1. Edit `defaults/config.yaml` and set `s3_bucket` to your bucket name:
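+1. Edit `defaults/config.yaml` and set `s3_dst_unversioned` to the full S3 URL of your cache destination (it must include the `s3://` scheme, followed by the bucket name and an optional key prefix):
    ```yaml
-   s3_bucket: "your-bucket-name"
+   s3_dst_unversioned: "s3://your-bucket-name/your/prefix"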
    ```
 2. Ensure AWS credentials are configured (via `aws configure` or environment variables)
 
@@ -48,13 +48,13 @@ The Nextstrain pipeline can automatically deploy resulting builds within the aus
 nextstrain build --image ghcr.io/nextstrain/tb:latest . deploy_all --configfile build-configs/nextstrain-automation/config.yaml
 ```
 
-Nextstrain's automated builds (run via GitHub Actions) use AWS S3 caching by setting `s3_bucket: "nextstrain-data"` in `build-configs/nextstrain-automation/config.yaml`. Results of tb-profiler and snippy analyses are stored in the `nextstrain-data` bucket for SRA samples that have already been analyzed in previous runs of this workflow, with the following file paths:
+Nextstrain's automated builds (run via GitHub Actions) use AWS S3 caching by setting `s3_dst_unversioned: "s3://nextstrain-data-unversioned/files/workflows/tb/"` in `build-configs/nextstrain-automation/config.yaml`. Results of tb-profiler and snippy analyses are stored in the `nextstrain-data-unversioned` bucket for SRA samples that have already been analyzed in previous runs of this workflow, with the following file paths:
 
 ##### tb-profiler
-* `s3://nextstrain-data/files/workflows/tb/data/tbprofiler/results/{sample}.results.json.zst`
+* `s3://nextstrain-data-unversioned/files/workflows/tb/data/tbprofiler/results/{sample}.results.json.zst`
 ##### snippy 
-* `s3://nextstrain-data/files/workflows/tb/data/snippy/{sample}/snps.aligned.fa.zst`
-* `s3://nextstrain-data/files/workflows/tb/data/snippy/{sample}/snps.vcf.zst`
+* `s3://nextstrain-data-unversioned/files/workflows/tb/data/snippy/{sample}/snps.aligned.fa.zst`
+* `s3://nextstrain-data-unversioned/files/workflows/tb/data/snippy/{sample}/snps.vcf.zst`
 
 These results files should be deleted from the S3 bucket if changes are made to the workflow that would influence the files, such as changes to the parameters used in the tb-profiler or snippy analysis steps, updates to the tb-profiler or snippy installations, or addition of new sequence quality filtering steps prior to running tb-profiler or snippy.
 

diff --git a/Snakefile b/Snakefile
@@ -115,7 +115,7 @@ rule run_tbprofiler:
     output:
         touch("data/tbprofiler/flags/{sample}_flag.txt"),
     params:
-        s3_bucket=config["s3_bucket"],
+        s3_dst_unversioned=config["s3_dst_unversioned"],
         tb_output_path="data/tbprofiler/results/{sample}.results.json",
         fastq_outdir="data/fastq",
         tb_outdir="data/tbprofiler",
@@ -135,7 +135,7 @@ rule run_tbprofiler:
         {params.fastq_outdir} \
         {params.tb_outdir} \
         {threads} \
-        {params.s3_bucket} \
+        {params.s3_dst_unversioned} \
         || echo "tbprofiler failed at sample {wildcards.sample}"
         rm -f data/tbprofiler/bam/{wildcards.sample}.bam*
         rm -f data/tbprofiler/vcf/{wildcards.sample}.targets.vcf.gz
@@ -192,7 +192,7 @@ rule run_snippy:
         touch("data/snippy/flags/{sample}_flag.txt"),
     priority: 1000
     params:
-        s3_bucket=config["s3_bucket"],
+        s3_dst_unversioned=config["s3_dst_unversioned"],
         snippy_output_path="data/snippy/{sample}",
         fastq_outdir="data/fastq",
         reference=config["files"]["reference_genbank"],
@@ -212,7 +212,7 @@ rule run_snippy:
         {params.fastq_outdir} \
         {params.reference} \
         {threads} \
-        {params.s3_bucket} \
+        {params.s3_dst_unversioned} \
         || echo "snippy failed at sample {wildcards.sample}"
         rm -f data/fastq/{wildcards.sample}_*.fastq.gz
         rm -fr data/snippy/{wildcards.sample}/reference

diff --git a/build-configs/nextstrain-automation/config.yaml b/build-configs/nextstrain-automation/config.yaml
@@ -1,5 +1,5 @@
 custom_rules:
   - build-configs/nextstrain-automation/deploy.smk
 
-s3_bucket: "nextstrain-data"
+s3_dst_unversioned: "s3://nextstrain-data-unversioned/files/workflows/tb/"
 deploy_url: "s3://nextstrain-data"
diff --git a/defaults/config.yaml b/defaults/config.yaml
@@ -1,5 +1,5 @@
 strain_id_field: "accession"
-s3_bucket: ""
+s3_dst_unversioned: ""
 files:
     exclude: "defaults/dropped_strains.txt"
     reference_genbank: "defaults/GCF_000195955.2_ASM19595v2_genomic.gbff"

diff --git a/scripts/run_snippy.sh b/scripts/run_snippy.sh
@@ -6,18 +6,16 @@ snippy_output_path="$2"
 fastq_outdir="$3"
 reference="$4"
 threads="$5"
-s3_bucket="${6:-}"
-
-s3_path="files/workflows/tb/${snippy_output_path}"
+s3_dst_unversioned="${6:-}"; s3_dst_unversioned="${s3_dst_unversioned%/}"  # optional S3 URL prefix; drop one trailing "/" so joined keys never contain "//"
 
 # Check if S3 bucket is configured and accessible
 USE_S3=false
-if [[ -n "${s3_bucket}" ]]; then
-    if aws s3 ls "s3://${s3_bucket}" > /dev/null 2>&1; then
+if [[ -n "${s3_dst_unversioned}" ]]; then
+    if aws s3 ls "${s3_dst_unversioned}" > /dev/null 2>&1; then
         USE_S3=true
         echo "S3 bucket accessible. Will use S3 caching." >&2
     else
-        echo "Warning: Cannot access s3://${s3_bucket}. Running without S3 caching." >&2
+        echo "Warning: Cannot access ${s3_dst_unversioned}. Running without S3 caching." >&2
     fi
 else
     echo "S3 bucket not specified. Running without S3 caching." >&2
@@ -45,18 +43,18 @@ upload_zstd() {
 
 # Try to download from S3 if enabled and BOTH expected .zst files exist
 if [[ "$USE_S3" == "true" ]] \
-   && aws s3 ls "s3://${s3_bucket}/${s3_path}/snps.aligned.fa.zst" >/dev/null 2>&1 \
-   && aws s3 ls "s3://${s3_bucket}/${s3_path}/snps.vcf.zst" >/dev/null 2>&1; then
+   && aws s3 ls "${s3_dst_unversioned}/${snippy_output_path}/snps.aligned.fa.zst" >/dev/null 2>&1 \
+   && aws s3 ls "${s3_dst_unversioned}/${snippy_output_path}/snps.vcf.zst" >/dev/null 2>&1; then
     echo "Found snippy results on S3 (.zst). Downloading to ${snippy_output_path} …" >&2
     mkdir -p "$(dirname "${snippy_output_path}")" "${snippy_output_path}"
 
     # Download and decompress aligned.fa, then remove local .zst
-    aws s3 cp "s3://${s3_bucket}/${s3_path}/snps.aligned.fa.zst" "${snippy_output_path}/snps.aligned.fa.zst"
+    aws s3 cp "${s3_dst_unversioned}/${snippy_output_path}/snps.aligned.fa.zst" "${snippy_output_path}/snps.aligned.fa.zst"
     zstd -d -f "${snippy_output_path}/snps.aligned.fa.zst" -o "${snippy_output_path}/snps.aligned.fa"
     rm -f "${snippy_output_path}/snps.aligned.fa.zst"
 
     # Download and decompress vcf, then remove local .zst
-    aws s3 cp "s3://${s3_bucket}/${s3_path}/snps.vcf.zst" "${snippy_output_path}/snps.vcf.zst"
+    aws s3 cp "${s3_dst_unversioned}/${snippy_output_path}/snps.vcf.zst" "${snippy_output_path}/snps.vcf.zst"
     zstd -d -f "${snippy_output_path}/snps.vcf.zst" -o "${snippy_output_path}/snps.vcf"
     rm -f "${snippy_output_path}/snps.vcf.zst"
 
@@ -110,7 +108,7 @@ else
     # Upload to S3 if enabled
     if [[ "$USE_S3" == "true" ]]; then
         echo "Uploading compressed snippy results to S3…" >&2
-        upload_zstd "${snippy_output_path}/snps.aligned.fa" "s3://${s3_bucket}/${s3_path}/snps.aligned.fa"
-        upload_zstd "${snippy_output_path}/snps.vcf"         "s3://${s3_bucket}/${s3_path}/snps.vcf"
+        upload_zstd "${snippy_output_path}/snps.aligned.fa" "${s3_dst_unversioned}/${snippy_output_path}/snps.aligned.fa"
+        upload_zstd "${snippy_output_path}/snps.vcf"         "${s3_dst_unversioned}/${snippy_output_path}/snps.vcf"
     fi
 fi
diff --git a/scripts/run_tbprofiler.sh b/scripts/run_tbprofiler.sh
@@ -6,29 +6,27 @@ tb_output_path="$2"
 fastq_outdir="$3"
 tb_outdir="$4"
 threads="$5"
-s3_bucket="${6:-}"
-
-s3_path="files/workflows/tb/${tb_output_path}"  # S3 key for the (compressed) tb-profiler output
+s3_dst_unversioned="${6:-}"; s3_dst_unversioned="${s3_dst_unversioned%/}"  # optional S3 URL prefix; drop one trailing "/" so joined keys never contain "//"
 
 # Check if S3 bucket is configured and accessible
 USE_S3=false
-if [[ -n "${s3_bucket}" ]]; then
-    if aws s3 ls "s3://${s3_bucket}" > /dev/null 2>&1; then
+if [[ -n "${s3_dst_unversioned}" ]]; then
+    if aws s3 ls "${s3_dst_unversioned}" > /dev/null 2>&1; then
         USE_S3=true
         echo "S3 bucket accessible. Will use S3 caching." >&2
     else
-        echo "Warning: Cannot access s3://${s3_bucket}. Running without S3 caching." >&2
+        echo "Warning: Cannot access ${s3_dst_unversioned}. Running without S3 caching." >&2
     fi
 else
     echo "S3 bucket not specified. Running without S3 caching." >&2
 fi
 
 # Try to download from S3 if enabled and results exist
-if [[ "$USE_S3" == "true" ]] && aws s3 ls "s3://${s3_bucket}/${s3_path}.zst" >/dev/null 2>&1; then
+if [[ "$USE_S3" == "true" ]] && aws s3 ls "${s3_dst_unversioned}/${tb_output_path}.zst" >/dev/null 2>&1; then
     echo "Found tb-profiler results on S3 (.zst). Downloading to ${tb_output_path} …" >&2
     mkdir -p "$(dirname "${tb_output_path}")"
 
-    aws s3 cp "s3://${s3_bucket}/${s3_path}.zst" "${tb_output_path}.zst"
+    aws s3 cp "${s3_dst_unversioned}/${tb_output_path}.zst" "${tb_output_path}.zst"
     zstd -d -f "${tb_output_path}.zst" -o "${tb_output_path}"
     rm -f "${tb_output_path}.zst"
 
@@ -80,7 +78,7 @@ else
         echo "Uploading compressed tb-profiler result to S3…" >&2
         # Compress -> upload -> remove local .zst (leave plain file locally)
         zstd -f -T"${threads}" -19 "${tb_output_path}" -o "${tb_output_path}.zst"
-        aws s3 cp "${tb_output_path}.zst" "s3://${s3_bucket}/${s3_path}.zst"
+        aws s3 cp "${tb_output_path}.zst" "${s3_dst_unversioned}/${tb_output_path}.zst"
         rm -f "${tb_output_path}.zst"
     fi
 fi