mirror of
https://github.com/fauxpilot/fauxpilot.git
synced 2025-07-06 21:11:53 -07:00
Add python backend support
- Modify dockerfile to include bitsandbytes, transformers and latest version of pytorch - Minor modifications in utils/codegen.py so that same client works with FT and Py-backend - Minor modifications in launch.sh (no need to name models by GPU) - Add installation script for adding a new python model (with super simple config_template) - Modify setup.sh so that it works with both FT and Python backend models Signed-off-by: Parth Thakkar <thakkarparth007@gmail.com>
This commit is contained in:
parent
9b2bc84670
commit
01f1cbb629
9 changed files with 487 additions and 73 deletions
42
python_backend/init_model.py
Normal file
42
python_backend/init_model.py
Normal file
|
@ -0,0 +1,42 @@
|
|||
"""
A simple script that sets up the model directory of a given model for Triton.

Given ``--model_dir``, ``--model_name`` and ``--org_name`` it produces::

    <model_dir>/py-<model_name>/py-model/config.pbtxt
    <model_dir>/py-<model_name>/py-model/1/model.py

``model.py`` is copied from the directory containing this script and
``config.pbtxt`` is rendered from ``config_template.pbtxt`` in that same
directory.
"""

import argparse
import shutil
from pathlib import Path
from string import Template

SCRIPT_DIR = Path(__file__).parent
CONFIG_TEMPLATE_PATH = SCRIPT_DIR/'config_template.pbtxt'


def build_parser():
    """Return the command-line parser for this script.

    The three ``--use_*`` options are kept as strings because their values
    are pasted verbatim into the config template.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument("--model_dir", type=str, required=True)
    parser.add_argument("--model_name", type=str, required=True)
    parser.add_argument("--org_name", type=str, required=True)
    parser.add_argument("--use_half", type=str, default="1")
    parser.add_argument("--use_int8", type=str, default="0")
    parser.add_argument("--use_auto_device_map", type=str, default="1")
    return parser


def render_config(template_text, *, org_name, model_name, use_half,
                  use_int8, use_auto_device_map):
    """Fill the ``$placeholder`` fields of *template_text* and return the result.

    Raises:
        KeyError: if the template references a placeholder other than the
            five supplied here.
        ValueError: if the template contains a malformed placeholder.
    """
    return Template(template_text).substitute(
        org_name=org_name,
        model_name=model_name,
        use_half=use_half,
        use_int8=use_int8,
        use_auto_device_map=use_auto_device_map,
    )


def init_model_dir(model_dir, model_name, org_name, use_half="1",
                   use_int8="0", use_auto_device_map="1", *,
                   script_dir=SCRIPT_DIR,
                   template_path=CONFIG_TEMPLATE_PATH):
    """Create the model directory, copy ``model.py`` and write ``config.pbtxt``.

    Args:
        model_dir: Root directory under which ``py-<model_name>`` is created.
        model_name: Used in the directory name and in the rendered config.
        org_name: Substituted into the rendered config.
        use_half, use_int8, use_auto_device_map: Substituted verbatim into
            the rendered config.
        script_dir: Directory holding the ``model.py`` to copy.
        template_path: Path of the config template to render.

    Returns:
        Path of the ``config.pbtxt`` file that was written.
    """
    # Step 1: Make model directory
    version_dir = Path(model_dir)/f"py-{model_name}/py-model/1"
    version_dir.mkdir(parents=True, exist_ok=True)

    # Step 2: copy model.py
    shutil.copy(Path(script_dir)/'model.py', version_dir/'model.py')

    # Step 3: Generate config.pbtxt
    with open(template_path, 'r', encoding='utf-8') as f:
        template_text = f.read()

    config = render_config(
        template_text,
        org_name=org_name,
        model_name=model_name,
        use_half=use_half,
        use_int8=use_int8,
        use_auto_device_map=use_auto_device_map,
    )

    # The config sits next to the version directory "1", i.e. in its parent;
    # use .parent rather than a literal ".." path segment.
    config_path = version_dir.parent/'config.pbtxt'
    with open(config_path, 'w', encoding='utf-8') as f:
        f.write(config)
    return config_path


def main(argv=None):
    """Parse *argv* (default: ``sys.argv[1:]``) and set up the model directory."""
    args = build_parser().parse_args(argv)
    init_model_dir(
        args.model_dir,
        args.model_name,
        args.org_name,
        use_half=args.use_half,
        use_int8=args.use_int8,
        use_auto_device_map=args.use_auto_device_map,
    )


# Guard the entry point so importing this module has no side effects.
if __name__ == "__main__":
    main()
|
Loading…
Add table
Add a link
Reference in a new issue