| 
					
				 | 
			
			
				@@ -1,56 +0,0 @@ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-# Copyright (c) 2020 NVIDIA Corporation.  All rights reserved. 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-#!/usr/bin/env bash 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-cp create_dir_and_download_pytorch_sif_file.sh ../../../../../../ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-cd ../../../../../../ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-mkdir output 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-mkdir output/sv_gpt3_ckpt/ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-mkdir dataset 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-# gdrive_download pre-built **pytorch_21.03.sif** which is needed to run singularity  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-# script to download Google Drive files from command line 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-# not guaranteed to work indefinitely 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-# taken from Stack Overflow answer: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-# http://stackoverflow.com/a/38937732/7002068 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-gURL=https://drive.google.com/file/d/18-QSZhPhNJS3m9ASTPkjnzsFVgg71MNx/view?usp=sharing 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-# match more than 26 word characters 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-ggID=$(echo "$gURL" | egrep -o '(\w|-){26,}') 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-ggURL='https://drive.google.com/uc?export=download' 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-curl -sc /tmp/gcokie "${ggURL}&id=${ggID}" >/dev/null 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-getcode="$(awk '/_warning_/ {print $NF}' /tmp/gcokie)" 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-cmd='curl --insecure -C - -LOJb /tmp/gcokie "${ggURL}&confirm=${getcode}&id=${ggID}"' 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-echo -e "Downloading from "$gURL"...\n" 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-eval $cmd 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-# gdrive_download toy dataset  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-gURL=https://drive.google.com/file/d/17hIXwG6jHgijmBJKq2Z211Hm6AXfQo9C/view?usp=sharing 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-# match more than 26 word characters 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-ggID=$(echo "$gURL" | egrep -o '(\w|-){26,}') 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-ggURL='https://drive.google.com/uc?export=download' 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-curl -sc /tmp/gcokie "${ggURL}&id=${ggID}" >/dev/null 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-getcode="$(awk '/_warning_/ {print $NF}' /tmp/gcokie)" 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-cmd='curl --insecure -C - -LOJb /tmp/gcokie "${ggURL}&confirm=${getcode}&id=${ggID}"' 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-echo -e "Downloading from "$gURL"...\n" 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-eval $cmd 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-### move toy data to correct dirs 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-mv toydata.zip ./dataset/ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-cd dataset/ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-unzip -r toydata.zip 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-cd .. 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-### move the Megatron run script to the correct directory 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-cp ./gpubootcamp/ai/Megatron/English/Python/source_code/Day1-runMegatron-LM_GPT_template.sh ./ 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				- 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-### clone Megatron-LM repo onto the current dir 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-git clone https://github.com/NVIDIA/Megatron-LM.git 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-ls . 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-echo "done !" 
			 |