[Commit page: 35 files with large diffs are not rendered by default.]
@@ -0,0 +1,84 @@
aitestbed
ALCFUserID
analyser
ANL
arnoldw
AUTOTUNE
Cerebras
conv
cosmictagger
cpus
cuda
cudart
DATADIR
dlerror
dlopen
elif
finetune
flos
gbps
GEMM
Graphcore
graphcore_login
gres
inet
inplace
jsons
kaggle
keras
keygen
keyscan
layernorm
lenet
libcudart
libnvinfer
LOGDIR
logreg
mgmt
mnist
MNIST
modelzoo
nodelist
ntasks
OUTDIR
passcode
petaFLOPS
POPART
POPLIBS
poptorch
popvision
pretrain
pretraining
PYTHONPATH
relu
RELU
resnet
run_unet_256_256_single_4
SambaFlow
sambanova
sbatch
scancel
Slurm
snconfig
snpath
snthreads
sntilestat
snvenv
softmax
squeue
SRAM
srun
tensorrt
tf2tensorrt
TFLOPs
unet
UNet
unet
unet_compile_run_all
Venkat
venv
venvs
vipu
virtualenv
wilsonb
XRDU
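
The list above reads as a spell-check allowlist for the repository's documentation: project names, CLI tools, and usernames that a stock dictionary would flag. As a minimal sketch of how such a list could be consumed, the snippet below feeds it to aspell as a personal dictionary; the filename .wordlist.txt, the use of aspell, and the header format are assumptions, not taken from this commit.

# Hypothetical: wrap the allowlist in aspell's personal-dictionary format.
# aspell expects a "personal_ws-1.1 <lang> <count>" header before the words.
{ echo "personal_ws-1.1 en 84"; cat .wordlist.txt; } > .aspell.en.pws
aspell --home-dir=. --personal=.aspell.en.pws check docs/example.md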
@@ -0,0 +1,64 @@
#! /bin/bash -x
set -e
#
# Usage: ./unet_all.sh 256 256
#
SECONDS=0

# Image size.
IM=${1}
# Batch size.
BS=${2}
NUM_WORKERS=1
export OMP_NUM_THREADS=16

# Activate the SambaFlow virtual environment.
source /opt/sambaflow/venv/bin/activate
UNET=$(pwd)/unet

echo "Model: UNET"
echo "Date: " $(date +%m/%d/%y)
echo "Time: " $(date +%H:%M)

echo "COMPILE"

# Compile for parallel RDUs, skipping compilation if the PEF already exists.
if [ ! -e out/unet_train_${BS}_${IM}_NN/unet_train_${BS}_${IM}_NN.pef ] ; then
    python ${UNET}/unet.py compile -b ${BS} --in-channels=3 --in-width=${IM} --in-height=${IM} --enable-conv-tiling --mac-v2 --compiler-configs-file ${UNET}/jsons/compiler_configs/unet_compiler_configs_no_inst.json --pef-name="unet_train_${BS}_${IM}_NN" --data-parallel -ws 2 > compile_${BS}_${IM}_NN.log 2>&1
fi

# Run multi-node, data parallel: queue unet_batch.sh on two nodes via Slurm.
NN=2
echo "RUN"
echo "NN=${NN}"
sbatch --gres=rdu:1 --tasks-per-node 8 --nodes 2 --nodelist sm-02,sm-01 --cpus-per-task=16 ./unet_batch.sh ${NN} ${NUM_WORKERS}
echo "Duration: " $SECONDS

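As a hypothetical usage sketch, the driver script above is submitted once and then monitored through Slurm; the batch script it queues follows below. The job ID placeholder is illustrative.

./unet_all.sh 256 256   # image size 256, batch size 256, per the Usage line
squeue -u $USER         # watch the queued unet_batch.sh job
# scancel <jobid>       # cancel it if needed (jobid from squeue output)
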
#! /bin/bash -x
set -e
#
# Usage: ./unet_batch.sh 2 1
#
SECONDS=0

# Batch size.
BS=256

# Image size.
IM=256
NN=${1}
NUM_WORKERS=${2}
export OMP_NUM_THREADS=16
DATADIR=/software/sambanova/dataset/kaggle_3m
UNET=$(pwd)/unet
export SAMBA_CCL_USE_PCIE_TRANSPORT=0

# TODO: Update this.
source /opt/sambaflow/venv/bin/activate

echo "Model: UNET_TRAIN"
echo "Date: " $(date +%m/%d/%y)
echo "Time: " $(date +%H:%M)

# Launch data-parallel training across the allocated tasks with MPI (PMI2),
# using the PEF compiled by unet_all.sh.
srun --mpi=pmi2 python ${UNET}/unet_hook.py run --do-train --in-channels=3 --in-width=${IM} --in-height=${IM} --init-features 32 --batch-size=${BS} --epochs 2 --data-dir ${DATADIR} --log-dir log_dir_unet_${NN}_train_kaggle --pef=$(pwd)/out/unet_train_${BS}_${IM}_NN/unet_train_${BS}_${IM}_NN.pef --data-parallel --reduce-on-rdu --num-workers=${NUM_WORKERS}

echo "Duration: " $SECONDS