cmu-delphi
diff --git a/‎.github/workflows/pull_baselines.yml‎
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/pull_baselines.yml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎.github/workflows/pull_ensembles.yml‎
Lines changed: 67 additions & 0 deletions b/‎.github/workflows/pull_ensembles.yml‎
Lines changed: 67 additions & 0 deletions
diff --git a/‎auxiliary-data/pull-flusight-ensembles.R‎
Lines changed: 101 additions & 0 deletions b/‎auxiliary-data/pull-flusight-ensembles.R‎
Lines changed: 101 additions & 0 deletions
@@ -11,7 +11,7 @@ on:
         required: false
         default: true
   schedule:
-    - cron: "20 19 * * 3"
+    - cron: "10 17 * * 3"
 
 permissions:
     contents: write
 
@@ -0,0 +1,67 @@
+# Workflow "Pull ensembles": started manually through workflow_dispatch.
+name: Pull ensembles
+on:
+  workflow_dispatch:
+    inputs:
+      # Optional free-text input shown in the manual-run form.
+      name:
+        required: false
+        description: 'Pull Ensembles'
+      # Boolean switch, on by default; the job reads it as `inputs.publish`.
+      publish:
+        type: boolean
+        default: true
+        required: false
+        description: 'Pull ensemble forecasts'
+
+# Grant the workflow token write access to repository contents and pull requests.
+permissions:
+  contents: write
+  pull-requests: write
+
+jobs:
+  # Downloads the ensemble files with the R script, validates them and opens a
+  # pull request whose description is the generated validation report.
+  pull_ensembles:
+    # Only run in repositories owned by cdcepi.
+    if: github.repository_owner == 'cdcepi'
+    runs-on: macOS-latest
+    steps:
+      - name: Checkout repo
+        uses: actions/checkout@v3
+        with:
+          fetch-depth: 0
+      - name: Setup R
+        uses: r-lib/actions/setup-r@v2
+        with:
+          use-public-rspm: true
+      - name: Install dependencies
+        run: |
+          install.packages("pak")
+          pak::pkg_install(c(
+          "readr", "dplyr", "tidyr",
+          "lubridate", "fs",
+          "github::hubverse-org/hubValidations"))
+        shell: Rscript {0}
+      - name: Pull ensemble csv files
+        run: Rscript auxiliary-data/pull-flusight-ensembles.R
+      - name: Show validation output in logs (for debugging)
+        run: cat validation_result.md || echo "No validation_result.md found"
+      # Expose the report as the multi-line step output `body`.
+      - name: Read validation result
+        id: validation
+        run: |
+          {
+            echo 'body<<EOF'
+            cat validation_result.md
+            echo 'EOF'
+          } >> "$GITHUB_OUTPUT"
+      - name: Commit changes and create PR 🚀
+        if: ${{ inputs.publish || github.event_name == 'schedule' }}
+        env:
+          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+          # Hand the report to the shell as data. Expanding the expression
+          # directly inside the script would let quotes, backticks or $(...)
+          # in a validation message break or inject into the command line.
+          PR_BODY: ${{ steps.validation.outputs.body }}
+        run: |
+          PR_DATETIME=$(date +'%Y-%m-%d_%H-%M-%S')
+          git config user.name "github-actions[bot]"
+          git config user.email "41898282+github-actions[bot]@users.noreply.github.com"
+          git checkout -b pull/ensembles/"$PR_DATETIME"
+          # NOTE(review): `git add .` also stages validation_result.md unless it
+          # is ignored elsewhere - confirm that committing it is intended.
+          git add .
+          # `git commit` exits non-zero when nothing is staged; stop cleanly instead.
+          if git diff --cached --quiet; then
+            echo "No changes to commit; skipping PR creation."
+            exit 0
+          fi
+          git commit -m "Pull ensemble forecasts"
+          git push --set-upstream origin pull/ensembles/"$PR_DATETIME"
+          gh pr create --title "Add new ensemble forecasts" \
+            --body "$PR_BODY" \
+            --base main \
+            --head pull/ensembles/"$PR_DATETIME"
+        shell: bash
@@ -0,0 +1,101 @@
+
+# Script that runs with the Pull ensembles action to download and save the weekly ensembles from the FluSight-ensemble repository.
+# Retrieves specifically FluSight-ensemble, FluSight-lop_norm, FluSight-trained_mean, FluSight-trained_med, FluSight-baseline_cat, FluSight-equal_cat, and
+# FluSight-ens_q_cat.
+# Runs Hub Validations on the files.
+
+# Load required libraries
+library(lubridate)
+library(hubValidations)
+library(fs)
+
+# Prepare output file for PR body
+result_file <- "validation_result.md"
+
+# Wrap the entire script in a top-level tryCatch so that an unexpected failure
+# is still reported through the result file instead of aborting without one.
+tryCatch({
+
+  # Set up reference date and file names.
+  # Presumably the Saturday that ends the current week (depends on lubridate's
+  # default week start) - confirm.
+  current_ref_date <- ceiling_date(Sys.Date(), "week") - days(1)
+  date_str <- format(current_ref_date, "%Y-%m-%d")
+
+  ensemble_types <- c("FluSight-ensemble",
+                      "FluSight-lop_norm",
+                      "FluSight-trained_mean",
+                      "FluSight-trained_med",
+                      "FluSight-baseline_cat",
+                      "FluSight-equal_cat",
+                      "FluSight-ens_q_cat")
+  # Source folder names currently mirror the model names one-to-one.
+  ensemble_folders <- ensemble_types
+
+  # One entry per file, keyed by "<model>/<file name>"; each entry is
+  # list(status = "pass" | "fail" | "error", message = <character or NULL>).
+  validation_results <- list()
+
+  for (i in seq_along(ensemble_types)) {
+    type <- ensemble_types[i]
+    folder <- ensemble_folders[i]
+    filename <- paste0(date_str, "-", type, ".csv")
+    # Path relative to model-output/, used both for validation and as report key.
+    file_path <- file.path(type, filename)
+
+    file_url <- paste0(
+      "https://raw.githubusercontent.com/cdcepi/Flusight-ensemble/main/model-output/",
+      folder, "/", filename
+    )
+
+    target_dir <- file.path("model-output", type)
+    dir_create(target_dir, recurse = TRUE)
+    destfile <- file.path(target_dir, filename)
+
+    # Attempt to download. The handler returns the failure text rather than
+    # recording it itself: assigning to validation_results with `<-` inside the
+    # handler function would only change a copy local to that function, so the
+    # failure would never reach the report.
+    download_error <- tryCatch({
+      download.file(url = file_url, destfile = destfile, method = "libcurl")
+      cat("✅ Downloaded and saved:", destfile, "\n")
+      NULL  # No error
+    }, error = function(e) {
+      msg <- paste("❌ Failed to download", filename, "Reason:", e$message)
+      cat(msg, "\n")
+      msg
+    })
+
+    # Record the failure and skip validation if the download did not succeed
+    if (!is.null(download_error)) {
+      validation_results[[file_path]] <- list(status = "error", message = download_error)
+      next
+    }
+
+    validation_results[[file_path]] <- tryCatch({
+      v <- hubValidations::validate_submission(hub_path = ".", file_path = file_path)
+
+      # check_for_errors() signals an error when validation failed; capture its
+      # message instead of letting it propagate.
+      err_msg <- tryCatch({
+        hubValidations::check_for_errors(v, verbose = TRUE)
+        NULL  # Passed
+      }, error = function(e) {
+        e$message  # Return error message
+      })
+
+      list(status = if (is.null(err_msg)) "pass" else "fail", message = err_msg)
+
+    }, error = function(e) {
+      # The validation call itself failed (as opposed to reporting failures)
+      list(status = "error", message = e$message)
+    })
+  }
+
+  # Compose validation_result.md content
+  messages <- c("### 🧪 Validation Results")
+
+  for (file in names(validation_results)) {
+    res <- validation_results[[file]]
+    if (res$status == "pass") {
+      messages <- c(messages, paste0("✅ **", file, "** passed validation."))
+    } else {
+      # Collapse so a multi-element message still yields a single report entry
+      detail <- paste(res$message, collapse = "\n")
+      messages <- c(messages, paste0("❌ **", file, "**: ", detail))
+    }
+  }
+
+  writeLines(messages, result_file)
+
+}, error = function(e) {
+  writeLines(c("### 🧪 Validation Results", "❌ Script failed unexpectedly:", e$message), result_file)
+})