mirror of
https://github.com/RichieCahill/dotfiles.git
synced 2026-04-17 21:18:18 -04:00
deleted train.sh
This commit is contained in:
@@ -1,45 +0,0 @@
|
||||
#!/usr/bin/env bash
# Fine-tune Qwen 3.5 4B on bill summarization data.
#
# Prerequisites:
#   1. Build the dataset:  python -m python.prompt_bench.build_finetune_dataset
#   2. Build the image:    docker build -f python/prompt_bench/Dockerfile.finetune -t bill-finetune .
#
# Usage:
#   bash python/prompt_bench/train.sh [extra flags passed to finetune.py]
#
# The dataset and output paths are resolved against the current working
# directory, so run this from the directory that contains output/.
#
# Examples:
#   bash python/prompt_bench/train.sh
#   bash python/prompt_bench/train.sh --epochs 5 --lr 1e-4
#   bash python/prompt_bench/train.sh --val-split 0.15 --save-gguf
#
# Exit status:
#   1 if the dataset file is missing; otherwise the first failing command's
#   status (set -e), or 0 on success.

set -euo pipefail

# Docker image tag produced by the "Build the image" prerequisite above.
readonly IMAGE="bill-finetune"

# Host-side paths, anchored at the caller's working directory.
DATASET="$(pwd)/output/finetune_dataset.jsonl"
OUTPUT_DIR="$(pwd)/output/qwen-bill-summarizer"
readonly DATASET OUTPUT_DIR

# Fail early, with diagnostics on stderr, when the dataset has not been built.
if [[ ! -f "$DATASET" ]]; then
  printf '%s\n' "Error: Dataset not found at $DATASET" >&2
  printf '%s\n' "Run: python -m python.prompt_bench.build_finetune_dataset" >&2
  exit 1
fi

# Create the output directory up front so the bind mount below targets an
# existing host directory.
mkdir -p "$OUTPUT_DIR"

echo "Starting fine-tuning..."
echo " Dataset: $DATASET"
echo " Output: $OUTPUT_DIR"
echo " Extra args: $*"

# Container invocation:
#   --device=nvidia.com/gpu=all  request all NVIDIA GPUs by device name
#                                (CDI-style name; presumably requires CDI to be
#                                configured on the host - confirm)
#   --ipc=host                   share the host IPC namespace with the container
#   -v ...                       mount the output dir read-write and the dataset
#                                read-only at fixed in-container paths
# Everything after the image name is passed to the container's command line;
# caller-supplied flags come last.
docker run --rm \
  --device=nvidia.com/gpu=all \
  --ipc=host \
  -v "$OUTPUT_DIR":/workspace/output/qwen-bill-summarizer \
  -v "$DATASET":/workspace/dataset.jsonl:ro \
  "$IMAGE" \
  --dataset /workspace/dataset.jsonl \
  --output-dir /workspace/output/qwen-bill-summarizer \
  "$@"

# Only reached when docker run exits 0 (set -e aborts otherwise).
echo "Done! Model saved to $OUTPUT_DIR"
|
||||
Reference in New Issue
Block a user