From 73fcb3ef1519922ef583e55b7f9fb6399d53e0ef Mon Sep 17 00:00:00 2001 From: Virginia Partridge Date: Wed, 13 Mar 2024 14:49:17 -0400 Subject: [PATCH] Manual download zst conversion needs --stdout flag --- dvc.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/dvc.yaml b/dvc.yaml index e636264..5003963 100644 --- a/dvc.yaml +++ b/dvc.yaml @@ -4,7 +4,7 @@ stages: foreach: ${download_months} do: desc: Download Reddit comments data for the month ${item}. - cmd: curl https://files.pushshift.io/reddit/comments/RC_${item}.zst | unzstd --long=31 | bzip2 > ${comments_dir}/RC_${item}.bz2 + cmd: curl https://files.pushshift.io/reddit/comments/RC_${item}.zst | unzstd --long=31 | bzip2 > ${comments_dir}/RC_${item}.bz2 outs: - ${comments_dir}/RC_${item}.bz2 @@ -14,7 +14,7 @@ stages: foreach: ${manual_download_months} do: desc: Converting manually downloaded Reddit comments to bzip for month ${item}. - cmd: unzstd --long=31 ${manual_downloads_dir}/comments/RC_${item}.zst | bzip2 > ${comments_dir}/RC_${item}.bz2 + cmd: unzstd --stdout --long=31 ${manual_downloads_dir}/comments/RC_${item}.zst | bzip2 > ${comments_dir}/RC_${item}.bz2 outs: - ${comments_dir}/RC_${item}.bz2