Goals: Add links that are reasonable and good explanations of how stuff works. No hype and no vendor content if possible. Practical first-hand accounts of models in prod eagerly sought.
data:image/s3,"s3://crabby-images/ad1fa/ad1fae02609473a3f11c48b1064a641deef5171b" alt="Screenshot 2023-12-18 at 10 40 27 PM"
sudo apt-get remove --purge '^nvidia-.*' | |
sudo ubuntu-drivers autoinstall | |
sudo reboot |
import pytorch_lightning as pl | |
... | |
# override this method on pytorch-lightning model | |
def on_predict_epoch_end(self, results): | |
# gather all results onto each device | |
# find created world_size from pl.trainer | |
results = all_gather(results[0], WORLD_SIZE, self._device) | |
# concatenate on the cpu | |
results = torch.concat([x.cpu() for x in results], dim=1) | |
# output will not preserve input order. |
# NOTE: | |
# You can find an updated, more robust and feature-rich implementation | |
# in Zeno Build | |
# - Zeno Build: https://github.com/zeno-ml/zeno-build/ | |
# - Implementation: https://github.com/zeno-ml/zeno-build/blob/main/zeno_build/models/providers/openai_utils.py | |
import openai | |
import asyncio | |
from typing import Any |