How to use Phison aiDAPTIV+

Phison-aiDAPTIV-plus.png

# Install LVM
# lvm2 provides the pvcreate/vgcreate/lvcreate tools and xfsprogs provides
# mkfs.xfs; both are needed by the later steps of this guide.

sudo apt update

sudo apt install lvm2 xfsprogs

# List disk/storage hardware and keep only the lines containing 'ai100',
# 'logical name' or 'version: EIFZ' so the /dev names of the target SSDs can
# be read off. (Presumably 'ai100' / 'EIFZ' are the aiDAPTIV SSD model and
# firmware strings -- confirm against your hardware.)
lshw -class disk -class storage | grep -E 'ai100|logical name|version: EIFZ'

# Show the NVMe block devices currently known to the kernel.
lsblk | grep nvme

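# DANGER: wipefs -a erases every filesystem/RAID/partition-table signature on the listed devices. Verify the device names against the lsblk output before running it!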

sudo wipefs -a /dev/nvme0n1 /dev/nvme1n1

# Create LVM

# Initialise both NVMe drives as LVM physical volumes.
sudo pvcreate /dev/nvme0n1 /dev/nvme1n1

# Group the two physical volumes into a volume group named "ai".
sudo vgcreate ai /dev/nvme0n1 /dev/nvme1n1

# Create logical volume "ai" inside volume group "ai": striped across
# 2 devices (-i 2) with a 128 KiB stripe size (-I 128k), using all of the
# free extents in the group (-l 100%FREE). It appears as /dev/ai/ai.
sudo lvcreate --type striped -i 2 -I 128k -l 100%FREE -n ai ai

# Mount LVM

# Format the disk.
#   -f           overwrite any filesystem signature already on the volume
#   -s size=4k   use a 4 KiB sector size
#   -m crc=0     disable metadata CRCs (selects the older V4 on-disk format)
# NOTE(review): recent xfsprogs releases flag the V4 format as deprecated --
# confirm that crc=0 is still required for aiDAPTIV+.

sudo mkfs.xfs -f -s size=4k -m crc=0 /dev/ai/ai

# Mount the disk.

sudo mkdir -p /mnt/nvme0

sudo mount /dev/ai/ai /mnt/nvme0

# Give the current user ownership of the mounted filesystem so it can be
# written without sudo.
sudo chown -R "$USER:$USER" /mnt/nvme0

# Make mount persistent
# Only tee needs root (it is the process that writes /etc/fstab), so the
# entry is produced without sudo. The grep guard keeps the step idempotent:
# the line is appended only if an identical line is not already present.
# "nofail" lets the system boot even when the volume is missing.

fstab_entry='/dev/ai/ai /mnt/nvme0 xfs defaults,nofail 0 0'
grep -qxF -- "$fstab_entry" /etc/fstab || printf '%s\n' "$fstab_entry" | sudo tee -a /etc/fstab

# Remove permanent mount setting
# sudo sed -i '\|^/dev/ai/ai |d' /etc/fstab

# Check disk status

lsblk

# If you need to tear down the LVM setup (use the same devices that were passed to pvcreate)

# sudo umount /mnt/nvme0; sudo lvremove -y ai; sudo pvremove -y --force --force /dev/nvme0n1 /dev/nvme1n1

# If you only have one SSD, please follow the steps below to mount

#sudo mkfs -t ext4 /dev/nvme1n1

#sudo mkdir -p /mnt/nvme0

#sudo mount /dev/nvme1n1 /mnt/nvme0

#sudo chown -R $USER:$USER /mnt/nvme0

# Return to the home directory, then create the training workspace under
# /data and make it owned by the current user.
cd

sudo mkdir -p /data/llm_train

sudo chown -R $USER:$USER /data

cd /data/llm_train

# Download and unpack the train-Llama-3.1-8B-Instruct archive
# (the 7z command must be installed).
wget https://d.leaderg.com/aidaptiv/train-Llama-3.1-8B-Instruct.7z

7z x train-Llama-3.1-8B-Instruct.7z

# Enter the model directory of the unpacked archive; the Hugging Face
# download that follows writes into a sub-directory of it.
cd /data/llm_train/train-Llama-3.1-8B-Instruct/model

# Hugging Face
#
# Create a read token (hf_xxxxx) in your Hugging Face account settings and
# export it in the shell before running the download, e.g.:
#   export HF_TOKEN=hf_xxxxx
# Never paste a real token into a script or guide: a token that has been
# published must be treated as leaked and revoked.

# Install python environment

pip install -U "huggingface_hub[cli]"

# Download the model into ./Llama-3.1-8B-Instruct.
# The token is taken from $HF_TOKEN; the command aborts with the message
# below when the variable is unset or empty.
# --resume-download and --local-dir-use-symlinks are intentionally omitted:
# they are deprecated in current huggingface_hub releases, where downloads
# always resume and --local-dir no longer creates symlinks.
huggingface-cli download --token "${HF_TOKEN:?set HF_TOKEN to your Hugging Face read token}" meta-llama/Llama-3.1-8B-Instruct --local-dir Llama-3.1-8B-Instruct

# Download the aiDAPTIV+ container image archive into its own directory.
mkdir -p /data/llm_train/aidaptiv

cd /data/llm_train/aidaptiv

wget https://phisonbucket.s3.ap-northeast-1.amazonaws.com/aiDAPTIV_vNXUN_2_01_00.tar.gz

# Import the image from the archive into the local Docker image store,
# then list the images to confirm it is present.
sudo docker load < aiDAPTIV_vNXUN_2_01_00.tar.gz

sudo docker image list

# Start an interactive container from the imported image with:
#   --gpus all                 all GPUs exposed to the container
#   --ipc=host                 host IPC namespace (shared memory)
#   --privileged=true          full device access
#   --ulimit memlock=-1        unlimited locked memory
#   --ulimit stack=67108864    64 MiB stack limit
# Bind mounts:
#   /data/llm_train/train-Llama-3.1-8B-Instruct -> /app
#   /mnt/nvme0                                  -> /mnt
#   /dev/mapper                                 -> /dev/mapper
sudo docker run --gpus all -it --ipc=host --privileged=true --ulimit memlock=-1 --ulimit stack=67108864 -v /data/llm_train/train-Llama-3.1-8B-Instruct:/app -v /mnt/nvme0:/mnt -v /dev/mapper:/dev/mapper aidaptiv:vNXUN_2_01_00

# Run the following inside the container shell opened by "docker run".
# /app is the bind-mounted train-Llama-3.1-8B-Instruct directory.
cd /app

cd commands

# Run the example script shipped in the commands directory
# (presumably a sample training run -- inspect example.sh to confirm).
bash example.sh

# List all docker containers

sudo docker ps -a

# Stop docker container

sudo docker stop <CONTAINER ID>

# Remove docker container

sudo docker rm <CONTAINER ID>