|
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 |
# Setup runbook: NVIDIA 575 driver + CUDA toolkit, Miniconda, and Axolotl.
# Run the steps in order from an interactive shell. Every `sudo reboot` ends a
# phase; continue with the next phase after logging back in.

# --- Phase 1: base packages ---------------------------------------------------
sudo apt update -y && sudo apt upgrade
# On Debian/Ubuntu the package that provides pip is named python3-pip.
sudo apt install python3 && sudo apt install python3-pip
sudo apt install qemu-guest-agent

# --- Phase 2: replace existing NVIDIA packages with the 575 open driver -------
# The glob is quoted so apt (not the shell) expands it.
sudo apt purge '*nvidia*' -y
sudo apt remove --purge libnvidia-egl-wayland1:i386 libnvidia-fbc1-575:i386 screen-resolution-extra -y
sudo apt autoremove
# Show any NVIDIA packages that are still registered with dpkg.
dpkg -l | grep nvidia

sudo apt install nvidia-driver-575-open -y
sudo apt install nvidia-utils-575 -y
sudo apt install nvidia-cuda-toolkit -y

# Rebuild DKMS modules and the initramfs before rebooting.
sudo dkms autoinstall
sudo update-initramfs -u
sudo reboot

# --- Phase 3: Miniconda -------------------------------------------------------
mkdir -p ~/miniconda3
wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh -O ~/miniconda3/miniconda.sh
# -b: batch (no prompts), -u: update an existing install, -p: install prefix.
bash ~/miniconda3/miniconda.sh -b -u -p ~/miniconda3
rm ~/miniconda3/miniconda.sh
sudo reboot

# --- Phase 4: conda environment -----------------------------------------------
source ~/miniconda3/bin/activate
conda init --all
conda create -n axolotl python=3.10
conda activate axolotl

# --- Phase 5: Axolotl and its Python dependencies -----------------------------
sudo apt install git -y
git clone https://github.com/OpenAccess-AI-Collective/axolotl
cd axolotl

pip install -U packaging==23.2 setuptools==75.8.0 wheel ninja
# Extras are quoted so the shell never treats [...] as a glob pattern.
pip install --no-build-isolation 'axolotl[deepspeed]'
pip install --no-build-isolation -e '.[bitsandbytes]'
pip install torch==2.7.1 torchvision==0.22.1+cu128 torchaudio==2.7.1 --index-url https://download.pytorch.org/whl/cu128
# pip has no `update` subcommand; upgrading is `pip install -U`.
# --no-build-isolation matches the other installs above so the build can use
# the torch that is already installed in this environment.
pip install -U --no-build-isolation flash-attn

# --- Phase 6: training --------------------------------------------------------
axolotl train fft-8b.yml
accelerate launch -m axolotl.cli.train instruct-lora-8b.yml

# --- Phase 7: regenerate the initramfs and reboot -----------------------------
sudo update-initramfs -u
sudo reboot
Apply the Blackwell Proxmox host-crash fix to:
/etc/modprobe.d/nvidia-graphics-drivers-kms.conf
Solution: https://forum.level1techs.com/t/do-your-rtx-5090-or-general-rtx-50-series-has-reset-bug-in-vm-passthrough/228549/35