Skip to content

Commit aac3441

Browse files
committed
feat: update examples to public lora
1 parent 1645884 commit aac3441

File tree

2 files changed

+13
-17
lines changed

2 files changed

+13
-17
lines changed

examples/backends/vllm/launch/lora/agg_lora_s3.sh

Lines changed: 8 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -35,34 +35,29 @@ DYN_SYSTEM_ENABLED=true DYN_SYSTEM_PORT=8081 \
3535
python -m dynamo.vllm --model Qwen/Qwen3-0.6B --enforce-eager \
3636
--connector none \
3737
--enable-lora \
38-
--max-lora-rank 32
38+
--max-lora-rank 64
3939

4040
################################## Example Usage ##################################
4141

4242
# Check available models
4343
curl http://localhost:8000/v1/models | jq .
4444

4545
# Load LoRA using s3 uri
46-
curl -X POST http://localhost:8081/v1/loras \
47-
-H "Content-Type: application/json" \
48-
-d '{
49-
"lora_name": "Neural-Hacker/Qwen3-Math-Reasoning-LoRA",
50-
"source": {
51-
"uri": "s3://my-loras/Neural-Hacker/Qwen3-Math-Reasoning-LoRA"
52-
}
53-
}'
46+
curl -s -X POST http://localhost:8081/v1/loras \
47+
-H "Content-Type: application/json" \
48+
-d '{"lora_name": "codelion/Qwen3-0.6B-accuracy-recovery-lora",
49+
"source": {"uri": "s3://my-loras/codelion/Qwen3-0.6B-accuracy-recovery-lora"}}' | jq .
5450

5551
# Test LoRA inference
5652
curl -X POST http://localhost:8000/v1/chat/completions \
5753
-H "Content-Type: application/json" \
5854
-d '{
59-
"model": "Neural-Hacker/Qwen3-Math-Reasoning-LoRA",
60-
"messages": [{"role": "user", "content": "Solve (x*x - x + 1 = 0) for x"}],
55+
"model": "codelion/Qwen3-0.6B-accuracy-recovery-lora",
56+
"messages": [{"role": "user", "content": "What is deep learning?"}],
6157
"max_tokens": 300,
6258
"temperature": 0.0
6359
}'
6460

65-
# Find the minimum possible value of \( x^2 + y^2 \) given that \( x \) and \( y \) are real numbers satisfying \( xy(x^2 - y^2) = x^2 + y^2 \) and \( x \neq 0 \)
6661
# Test base model inference (for comparison)
6762
curl -X POST http://localhost:8000/v1/chat/completions \
6863
-H "Content-Type: application/json" \
@@ -74,4 +69,4 @@ curl -X POST http://localhost:8000/v1/chat/completions \
7469
}'
7570

7671
# Unload LoRA
77-
curl -X DELETE http://localhost:8081/v1/loras/Neural-Hacker/Qwen3-Math-Reasoning-LoRA
72+
curl -X DELETE http://localhost:8081/v1/loras/codelion/Qwen3-0.6B-accuracy-recovery-lora

examples/backends/vllm/launch/lora/setup_minio.sh

Lines changed: 5 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -20,8 +20,8 @@ MINIO_SECRET_KEY="minioadmin"
2020
BUCKET_NAME="my-loras"
2121

2222
# Default LoRA to download (can be overridden)
23-
HF_LORA_REPO="${HF_LORA_REPO:-Neural-Hacker/Qwen3-Math-Reasoning-LoRA}"
24-
LORA_NAME="${LORA_NAME:-Neural-Hacker/Qwen3-Math-Reasoning-LoRA}"
23+
HF_LORA_REPO="${HF_LORA_REPO:-codelion/Qwen3-0.6B-accuracy-recovery-lora}"
24+
LORA_NAME="${LORA_NAME:-codelion/Qwen3-0.6B-accuracy-recovery-lora}"
2525
# TEMP_DIR will be created using mktemp when needed
2626
TEMP_DIR=""
2727

@@ -63,8 +63,8 @@ show_help() {
6363
echo " --help, -h Show this help message"
6464
echo ""
6565
echo "Environment Variables:"
66-
echo " HF_LORA_REPO Hugging Face repository (default: ${HF_LORA_REPO:-Neural-Hacker/Qwen3-Math-Reasoning-LoRA})"
67-
echo " LORA_NAME Local name for the LoRA (default: ${LORA_NAME:-Neural-Hacker/Qwen3-Math-Reasoning-LoRA})"
66+
echo " HF_LORA_REPO Hugging Face repository (default: ${HF_LORA_REPO:-codelion/Qwen3-0.6B-accuracy-recovery-lora})"
67+
echo " LORA_NAME Local name for the LoRA (default: ${LORA_NAME:-codelion/Qwen3-0.6B-accuracy-recovery-lora})"
6868
echo ""
6969
echo "Examples:"
7070
echo " $0 # Full setup"
@@ -173,6 +173,7 @@ download_lora_from_hf() {
173173

174174
print_success "LoRA downloaded to ${TEMP_DIR}"
175175

176+
rm -rf "${TEMP_DIR}/.cache"
176177
# List downloaded files
177178
echo "Downloaded files:"
178179
ls -lh "${TEMP_DIR}"

0 commit comments

Comments
 (0)