From fa420c623a403b8630920c90e8262543dc97ba56 Mon Sep 17 00:00:00 2001 From: Aditya Purang <44022838+aditya-purang@users.noreply.github.com> Date: Thu, 11 Apr 2024 15:45:49 +0100 Subject: [PATCH] Update README.md to download training data from regions other than us-east-1 --- dp_bert_hf_pretrain/README.md | 2 ++ 1 file changed, 2 insertions(+) diff --git a/dp_bert_hf_pretrain/README.md b/dp_bert_hf_pretrain/README.md index 65901bc..5b6cb00 100644 --- a/dp_bert_hf_pretrain/README.md +++ b/dp_bert_hf_pretrain/README.md @@ -502,6 +502,8 @@ kubectl exec -it cmd-shell -- /bin/bash Run the following commands from within the bash prompt on the command shell pod: +NOTE: The bucket is in us-east-1, so you will need to add `--region us-east-1` to the `aws s3 cp` command if your cluster is not in us-east-1. + ``` cd /data aws s3 cp s3://neuron-s3/training_datasets/bert_pretrain_wikicorpus_tokenized_hdf5/bert_pretrain_wikicorpus_tokenized_hdf5_seqlen128.tar . --no-sign-request