A Rust and gRPC server for BLOOM Inference.
(cd server && pip install .)
(cd router && cargo build --release)
python server/bloom_inference/main.py bigscience/bloom --num-gpus 8 --shard-directory /dev/shm/models
./router/target/release/router