From c9dbe70bdb10bed797e655f4ba2ec57cd6229d47 Mon Sep 17 00:00:00 2001
From: Alexis Bruneteau
Date: Wed, 1 Oct 2025 18:52:16 +0200
Subject: [PATCH] Fix DVC pull to only fetch raw data
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Changed dvc pull to specifically pull data/raw.dvc instead of all outputs.
The processed data and model files are generated by the DVC pipeline
(dvc repro), not pulled from remote storage.

This prevents errors about missing processed files that haven't been
generated yet.

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude
---
NOTE(review): this patch was restored from a copy whose line breaks and
leading whitespace had been collapsed. The YAML indentation of the hunk
lines below is presumed from the usual workflow layout; confirm it against
.gitea/workflows/mlops-pipeline.yml before applying.

Both hunks make the same change: `dvc pull` is given the explicit target
data/raw.dvc. The `|| echo` fallback is kept, so a failed pull still does
not fail the step.

 .gitea/workflows/mlops-pipeline.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.gitea/workflows/mlops-pipeline.yml b/.gitea/workflows/mlops-pipeline.yml
index 2e2da7e..616b254 100644
--- a/.gitea/workflows/mlops-pipeline.yml
+++ b/.gitea/workflows/mlops-pipeline.yml
@@ -38,7 +38,7 @@ jobs:
           poetry run dvc remote modify minio access_key_id $AWS_ACCESS_KEY_ID
           poetry run dvc remote modify minio secret_access_key $AWS_SECRET_ACCESS_KEY
           poetry run dvc remote list
-          poetry run dvc pull || echo "DVC pull failed, continuing..."
+          poetry run dvc pull data/raw.dvc || echo "DVC pull failed, continuing..."
         env:
           AWS_ACCESS_KEY_ID: ${{ secrets.DVC_ID }}
           AWS_SECRET_ACCESS_KEY: ${{ secrets.DVC_PASSWORD }}
@@ -84,7 +84,7 @@ jobs:
           poetry run dvc remote modify minio access_key_id $AWS_ACCESS_KEY_ID
           poetry run dvc remote modify minio secret_access_key $AWS_SECRET_ACCESS_KEY
           poetry run dvc remote list
-          poetry run dvc pull || echo "DVC pull failed, continuing..."
+          poetry run dvc pull data/raw.dvc || echo "DVC pull failed, continuing..."
         env:
           AWS_ACCESS_KEY_ID: ${{ secrets.DVC_ID }}
           AWS_SECRET_ACCESS_KEY: ${{ secrets.DVC_PASSWORD }}