Dockerize (#22)

* Create Dockerfile and docker-compose.yml

* Update docker-compose.yml

* Add Docker instructions to README
Author: joecryptotoo
Date: 2024-08-22 02:00:42 -07:00 (committed by GitHub)
Parent: ec3c225a0f
Commit: 8096f91d02
6 changed files with 72 additions and 2 deletions

.dockerignore (new file)
@@ -0,0 +1,6 @@
tmp
cache
Dockerfile
docker-compose.yml
.dockerignore
.gitignore

.gitignore

@@ -1,2 +1,3 @@
 __pycache__
 tmp
+cache

Dockerfile (new file)

@@ -0,0 +1,13 @@
FROM pytorch/pytorch:2.4.0-cuda12.1-cudnn9-devel
ENV PYTHONUNBUFFERED=1
WORKDIR /usr/src/app
# Install git (needed for pip installs from git URLs), then clean up the apt lists
RUN apt-get update && apt-get install -y git && rm -rf /var/lib/apt/lists/*
# Install Python dependencies first so this layer is cached across code changes
COPY requirements.txt ./
RUN pip install --no-cache-dir -r requirements.txt
COPY . .
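The Dockerfile sets no CMD; the committed setup supplies the command through docker-compose.yml below. For a quick smoke test without Compose, the image can be built and run directly. A minimal sketch — the `speech-to-speech` tag is an illustrative assumption, and the port/flag choices mirror the Compose service:

```sh
# Build the image from the repo root (tag name is an assumption)
docker build -t speech-to-speech .

# Run with GPU access; the entrypoint must be given explicitly,
# mirroring the command in docker-compose.yml
docker run --rm --gpus all -p 12345:12345 -p 12346:12346 \
  speech-to-speech python3 s2s_pipeline.py --recv_host 0.0.0.0 --send_host 0.0.0.0
```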

README.md

@@ -12,6 +12,7 @@
 - [Modularity](#modularity)
 * [Setup](#setup)
 * [Usage](#usage)
+- [Docker Server approach](#docker-server)
 - [Server/Client approach](#serverclient-approach)
 - [Local approach](#local-approach)
 * [Command-line usage](#command-line-usage)
@@ -56,6 +57,15 @@ The pipeline can be run in two ways:
 - **Server/Client approach**: Models run on a server, and audio input/output are streamed from a client.
 - **Local approach**: Uses the same client/server method but with the loopback address.
 
+### Docker Server
+
+#### Install the NVIDIA Container Toolkit
+https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/latest/install-guide.html
+
+#### Start the docker container
+```docker compose up```
+
 ### Server/Client Approach
 To run the pipeline on the server:
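The linked guide covers package installation per distro; once the toolkit is installed, the remaining wiring and a GPU sanity check look roughly like the sketch below (commands from NVIDIA's guide; the CUDA image tag is an assumption used only for the check):

```sh
# Register the NVIDIA runtime with Docker and restart the daemon
sudo nvidia-ctk runtime configure --runtime=docker
sudo systemctl restart docker

# Confirm containers can see the GPU before starting the pipeline
docker run --rm --gpus all nvidia/cuda:12.1.0-base-ubuntu22.04 nvidia-smi

# Build and start the service defined in docker-compose.yml
docker compose up --build
```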

docker-compose.yml (new file)

@@ -0,0 +1,40 @@
---
version: "3.8"

services:
  pipeline:
    build:
      context: .
    # Same entrypoint as running s2s_pipeline.py directly; bind to all
    # interfaces so a client can reach the container from outside
    command:
      - python3
      - s2s_pipeline.py
      - --recv_host
      - 0.0.0.0
      - --send_host
      - 0.0.0.0
      - --lm_model_name
      - microsoft/Phi-3-mini-4k-instruct
      - --init_chat_role
      - system
      - --init_chat_prompt
      - "You are a helpful assistant"
      - --stt_compile_mode
      - reduce-overhead
      - --tts_compile_mode
      - default
    expose:
      - 12345/tcp
      - 12346/tcp
    ports:
      - 12345:12345/tcp
      - 12346:12346/tcp
    volumes:
      # Persist the model cache between container runs
      - ./cache/:/root/.cache/
      # Mount the pipeline script so edits apply without rebuilding the image
      - ./s2s_pipeline.py:/usr/src/app/s2s_pipeline.py
    deploy:
      resources:
        reservations:
          devices:
            # Reserve GPU 0 through the NVIDIA Container Toolkit
            - driver: nvidia
              device_ids: ['0']
              capabilities: [gpu]
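Ports 12345 and 12346 are published on the host, and the `./cache` volume keeps downloaded model weights across container restarts. A quick sketch for checking the GPU reservation and watching the pipeline once the service is up:

```sh
# Confirm the container sees the GPU reserved under deploy.resources
docker compose exec pipeline nvidia-smi

# Follow pipeline output; model downloads land in ./cache on the host
docker compose logs -f pipeline
```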

requirements.txt

@@ -1,4 +1,4 @@
-nltk==3.8.1
+nltk==3.9.1
 parler_tts @ git+https://github.com/huggingface/parler-tts.git
 torch==2.4.0
 sounddevice==0.5.0
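The only version change is the nltk bump. A one-off `docker compose run` (which overrides the service command) is a simple way to confirm the version that actually resolved inside the image:

```sh
# Verify the pinned nltk version installed in the built image
docker compose run --rm pipeline python3 -c "import nltk; print(nltk.__version__)"
```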