Files
llmsecops-research/run.sh

36 lines
1.2 KiB
Bash
Executable File

#!/usr/bin/bash
# create Python virtual environment
python3.12 -m venv .env
source .env/bin/activate
# the ONNX model/data require git Large File System support
git lfs install
# install Python dependencies
# pip install huggingface-hub[cli] langchain langchain_huggingface langchain_community optimum[onnxruntime] faiss-cpu
pip install -r ./requirements.txt
# environment variables
export MODEL_BASE_DIR="./infrastructure/foundation_model"
export MODEL_CPU_DIR="cpu_and_mobile/cpu-int4-rtn-block-32-acc-level-4"
MODEL_DATA_FILENAME="phi3-mini-4k-instruct-cpu-int4-rtn-block-32-acc-level-4.onnx.data"
MODEL_DATA_FILEPATH="$MODEL_BASE_DIR/$MODEL_CPU_DIR/$MODEL_DATA_FILENAME"
echo "==================="
echo "$MODEL_DATA_FILEPATH"
echo "==================="
# get foundation model dependencies from HuggingFace / Microsoft
if [ ! -f "$MODEL_DATA_FILEPATH" ]; then
echo "Downloading foundation model..."
huggingface-cli download microsoft/Phi-3-mini-4k-instruct-onnx \
--include "$MODEL_CPU_DIR/*" \
--local-dir $MODEL_BASE_DIR
else
echo "Foundation model files already exist at: $MODEL_DATA_FILEPATH"
fi
python -m src.text_generation.entrypoints.server