Commit aff8410

git subrepo pull (merge) --force shared/vendored
subrepo:
  subdir:   "shared/vendored"
  merged:   "c29898f"
upstream:
  origin:   "https://github.com/nextstrain/shared"
  branch:   "main"
  commit:   "c29898f"
git-subrepo:
  version:  "0.4.9"
  origin:   "https://github.com/ingydotnet/git-subrepo"
  commit:   "5e0f401"
1 parent 4d05760 commit aff8410

5 files changed: 92 additions & 13 deletions

shared/vendored/.github/workflows/ci.yaml
Lines changed: 1 addition & 1 deletion

@@ -11,5 +11,5 @@ jobs:
   shellcheck:
     runs-on: ubuntu-latest
     steps:
-      - uses: actions/checkout@v5
+      - uses: actions/checkout@v6
       - uses: nextstrain/.github/actions/shellcheck@master

shared/vendored/.github/workflows/pre-commit.yaml
Lines changed: 1 addition & 1 deletion

@@ -7,7 +7,7 @@ jobs:
   pre-commit:
     runs-on: ubuntu-latest
    steps:
-      - uses: actions/checkout@v5
+      - uses: actions/checkout@v6
       - uses: actions/setup-python@v6
         with:
           python-version: "3.12"

shared/vendored/.gitrepo
Lines changed: 3 additions & 3 deletions

@@ -6,7 +6,7 @@
 [subrepo]
 	remote = https://github.com/nextstrain/shared
 	branch = main
-	commit = 43e5a6fe06c95f605cc573a7e6ad2d4a023db7b9
-	parent = b6b1000536050c6ebcbde0c79902c16b0b76a11a
+	commit = c29898f7c32c3f85d65db235d23a78e776f89120
+	parent = 4d057604f9c65bae794c7bfe3f2d2514f7deee32
 	method = merge
-	cmdver = 0.4.6
+	cmdver = 0.4.9
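Since `.gitrepo` uses git-config (INI-style) syntax, its fields can be read with stdlib tooling. A minimal sketch using Python's `configparser`, with the file contents taken from the post-commit state of this diff (reading it this way is an illustration, not something the vendored scripts do):

```python
import configparser

# Contents of shared/vendored/.gitrepo after this commit
GITREPO = """\
[subrepo]
	remote = https://github.com/nextstrain/shared
	branch = main
	commit = c29898f7c32c3f85d65db235d23a78e776f89120
	parent = 4d057604f9c65bae794c7bfe3f2d2514f7deee32
	method = merge
	cmdver = 0.4.9
"""

parser = configparser.ConfigParser()
parser.read_string(GITREPO)

# The [subrepo] section records which upstream commit is vendored
subrepo = parser["subrepo"]
print(subrepo["commit"][:7])   # → c29898f (short hash of vendored upstream commit)
print(subrepo["cmdver"])       # → 0.4.9 (git-subrepo version used for the pull)
```

This is how `git subrepo` itself knows, on the next `pull`, which upstream commit the subdirectory is currently synced to.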

shared/vendored/README.md
Lines changed: 4 additions & 4 deletions

@@ -22,7 +22,7 @@ Then add the latest shared scripts to the pathogen repo by running:
 git subrepo clone https://github.com/nextstrain/shared shared/vendored
 ```
 
-Any future updates of sahred scripts can be pulled in with:
+Any future updates of shared scripts can be pulled in with:
 
 ```
 git subrepo pull shared/vendored
@@ -90,7 +90,7 @@ Scripts for supporting workflow automation that don’t really belong in any of
 - [notify-on-diff](scripts/notify-on-diff) - Send Slack message with diff of a local file and an S3 object
 - [notify-on-job-fail](scripts/notify-on-job-fail) - Send Slack message with details about failed workflow job on GitHub Actions and/or AWS Batch
 - [notify-on-job-start](scripts/notify-on-job-start) - Send Slack message with details about workflow job on GitHub Actions and/or AWS Batch
-- [notify-on-record-change](scripts/notify-on-recod-change) - Send Slack message with details about line count changes for a file compared to an S3 object's metadata `recordcount`.
+- [notify-on-record-change](scripts/notify-on-record-change) - Send Slack message with details about line count changes for a file compared to an S3 object's metadata `recordcount`.
   If the S3 object's metadata does not have `recordcount`, then will attempt to download S3 object to count lines locally, which only supports `xz` compressed S3 objects.
 - [notify-slack](scripts/notify-slack) - Send message or file to Slack
 - [s3-object-exists](scripts/s3-object-exists) - Used to prevent 404 errors during S3 file comparisons in the notify-* scripts
@@ -114,7 +114,7 @@ Potential Nextstrain CLI scripts
 - [upload-to-s3](scripts/upload-to-s3) - Upload file to AWS S3 bucket with compression based on file extension in S3 URL.
   Skips upload if the local file's hash is identical to the S3 object's metadata `sha256sum`.
   Adds the following user defined metadata to uploaded S3 object:
-  - `sha256sum` - hash of the file generated by [sha256sum](sha256sum)
+  - `sha256sum` - hash of the file generated by [sha256sum](scripts/sha256sum)
   - `recordcount` - the line count of the file
 - [download-from-s3](scripts/download-from-s3) - Download file from AWS S3 bucket with decompression based on file extension in S3 URL.
   Skips download if the local file already exists and has a hash identical to the S3 object's metadata `sha256sum`.
@@ -123,7 +123,7 @@ Potential Nextstrain CLI scripts
 
 Snakemake workflow functions that are shared across many pathogen workflows that don’t really belong in any of our existing tools.
 
-- [config.smk](snakemake/config.smk) - Shared functions for parsing workflow configs.
+- [config.smk](snakemake/config.smk) - Shared functions for handling workflow configs.
 - [remote_files.smk](snakemake/remote_files.smk) - Exposes the `path_or_url` function which will use Snakemake's storage plugins to download/upload files to remote providers as needed.
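The README describes the two user-defined metadata fields that `upload-to-s3` attaches to an S3 object: a `sha256sum` of the file and a `recordcount` line count. Their semantics can be sketched in a few lines of Python; `compute_metadata` is a hypothetical helper name for illustration, not one of the vendored scripts:

```python
import hashlib

def compute_metadata(data: bytes) -> dict:
    """Compute the two user-defined metadata fields the README describes:
    a SHA-256 hex digest of the file contents and its line count.
    (Hypothetical helper; the actual vendored scripts are shell-based.)"""
    return {
        "sha256sum": hashlib.sha256(data).hexdigest(),
        "recordcount": str(data.count(b"\n")),
    }

meta = compute_metadata(b"record1\nrecord2\nrecord3\n")
print(meta["recordcount"])  # → 3
```

Comparing these fields against a local file is what lets `upload-to-s3`, `download-from-s3`, and `notify-on-record-change` skip work or report changes without re-transferring data.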

shared/vendored/snakemake/config.smk
Lines changed: 83 additions & 4 deletions

@@ -1,19 +1,59 @@
 """
-Shared functions to be used within a Snakemake workflow for parsing
+Shared functions to be used within a Snakemake workflow for handling
 workflow configs.
 """
-import os.path
+import os
+import sys
+import yaml
 from collections.abc import Callable
-from snakemake.io import Wildcards
 from typing import Optional
 from textwrap import dedent, indent
 
 
+# Set search paths for Augur
+if "AUGUR_SEARCH_PATHS" in os.environ:
+    print(dedent(f"""\
+        Using existing search paths in AUGUR_SEARCH_PATHS:
+
+        {os.environ["AUGUR_SEARCH_PATHS"]!r}
+        """), file=sys.stderr)
+else:
+    # Note that this differs from the search paths used in
+    # resolve_config_path().
+    # This is the preferred default moving forwards, and the plan is to
+    # eventually update resolve_config_path() to use AUGUR_SEARCH_PATHS.
+    search_paths = [
+        # User analysis directory
+        Path.cwd(),
+
+        # Workflow defaults folder
+        Path(workflow.basedir) / "defaults",
+
+        # Workflow root (contains Snakefile)
+        Path(workflow.basedir),
+    ]
+
+    # This should work for majority of workflows, but we could consider doing a
+    # more thorough search for the nextstrain-pathogen.yaml. This would likely
+    # replicate how CLI searches for the root.¹
+    # ¹ <https://github.com/nextstrain/cli/blob/d5e184c5/nextstrain/cli/command/build.py#L413-L420>
+    repo_root = Path(workflow.basedir) / ".."
+    if (repo_root / "nextstrain-pathogen.yaml").is_file():
+        search_paths.extend([
+            # Pathogen repo root
+            repo_root,
+        ])
+
+    search_paths = [path.resolve() for path in search_paths if path.is_dir()]
+
+    os.environ["AUGUR_SEARCH_PATHS"] = ":".join(map(str, search_paths))
+
+
 class InvalidConfigError(Exception):
     pass
 
 
-def resolve_config_path(path: str, defaults_dir: Optional[str] = None) -> Callable[[Wildcards], str]:
+def resolve_config_path(path: str, defaults_dir: Optional[str] = None) -> Callable:
     """
     Resolve a relative *path* given in a configuration value. Will always try to
     resolve *path* after expanding wildcards with Snakemake's `expand` functionality.
@@ -75,3 +115,42 @@ def resolve_config_path(path: str, defaults_dir: Optional[str] = None) -> Callab
         """), " " * 4))
 
     return _resolve_config_path
+
+
+def write_config(path, section=None):
+    """
+    Write Snakemake's 'config' variable, or a section of it, to a file.
+
+    *section* is an optional list of keys to navigate to a specific section of
+    config. If provided, only that section will be written.
+    """
+    global config
+
+    os.makedirs(os.path.dirname(path), exist_ok=True)
+
+    data = config
+    section_str = "config"
+
+    if section:
+        # Navigate to the specified section
+        for key in section:
+            # Error if key doesn't exist
+            if key not in data:
+                raise Exception(f"ERROR: Key {key!r} not found in {section_str!r}.")
+
+            data = data[key]
+            section_str += f".{key}"
+
+    # Error if value is not a mapping
+    if not isinstance(data, dict):
+        raise Exception(f"ERROR: {section_str!r} is not a mapping of key/value pairs.")
+
+    with open(path, 'w') as f:
+        yaml.dump(data, f, sort_keys=False, Dumper=NoAliasDumper)
+
+    print(f"Saved {section_str!r} to {path!r}.", file=sys.stderr)
+
+
+class NoAliasDumper(yaml.SafeDumper):
+    def ignore_aliases(self, data):
+        return True
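The new `write_config` helper walks an optional list of keys down into Snakemake's nested `config` mapping before dumping it to YAML. That navigation logic can be exercised standalone; this is a minimal sketch using a stand-in dict in place of Snakemake's global `config` variable, with illustrative keys (`builds`, `global`, `min_length`) that are assumptions, not from any real workflow:

```python
def select_section(config: dict, section=None):
    """Navigate *section* (a list of keys) into *config*, mirroring the
    key-walking in write_config(); returns a dotted section name and the
    selected sub-mapping. Stand-in sketch, not the vendored function."""
    data = config
    section_str = "config"
    if section:
        for key in section:
            # Error if a key along the path doesn't exist
            if key not in data:
                raise KeyError(f"Key {key!r} not found in {section_str!r}.")
            data = data[key]
            section_str += f".{key}"
    # The final value must itself be a mapping, since it gets dumped as YAML
    if not isinstance(data, dict):
        raise TypeError(f"{section_str!r} is not a mapping of key/value pairs.")
    return section_str, data

config = {"builds": {"global": {"min_length": 27000}}}
name, section = select_section(config, ["builds", "global"])
print(name)     # → config.builds.global
print(section)  # → {'min_length': 27000}
```

The dotted `section_str` exists purely for error messages and logging, so a failure reports exactly where in the nested config the lookup went wrong.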
