-
-
Notifications
You must be signed in to change notification settings - Fork 329
Expand file tree
/
Copy pathtest-gpt-oss.sh
More file actions
25 lines (22 loc) · 767 Bytes
/
test-gpt-oss.sh
File metadata and controls
25 lines (22 loc) · 767 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
#!/bin/bash
# Real Human Test: GPT-OSS with MoE CPU Offloading
# Let's see if this actually generates text!
#
# Usage: run from the directory that contains ./target and ./models, because
# the shimmy binary and the GGUF model file are referenced by relative path.
#
# Exit status: the exit status of the shimmy command (0 on success), so a
# failed generation is visible to whoever invokes this script.

readonly BANNER_RULE="========================================="

# Prints the banner describing the model, hardware and test being run.
print_header() {
  printf '%s\n' \
    "$BANNER_RULE" \
    "GPT-OSS MoE Test - Can it actually work?" \
    "$BANNER_RULE" \
    "" \
    "Model: GPT-OSS 20B Q4_K_M (11.6GB)" \
    "Hardware: RTX 3060 (4GB VRAM)" \
    "Test: Generate a simple response" \
    "" \
    "Starting generation..." \
    ""
}

# Runs one short generation through shimmy with the --cpu-moe flag.
# NO_COLOR=1 and SHIMMY_BASE_GGUF are set only for this one command.
# NOTE(review): the model name passed to `generate` is `phi3-lora` while the
# GGUF file is GPT-OSS; presumably shimmy resolves that name to the file in
# SHIMMY_BASE_GGUF — confirm against shimmy's model discovery rules.
# Returns: the exit status of shimmy.exe.
run_generation() {
  NO_COLOR=1 SHIMMY_BASE_GGUF=./models/gpt-oss-20b-Q4_K_M.gguf \
    ./target/release/shimmy.exe --cpu-moe generate phi3-lora \
    --prompt "Say hello and introduce yourself in one sentence." \
    --max-tokens 50
}

# Prints the header, runs the generation, then reports the outcome.
# Returns: 0 if the generation command succeeded, otherwise its exit status.
main() {
  local status=0

  print_header

  # Capture the status instead of ignoring it; `set -e` is deliberately not
  # used so the closing banner is always printed.
  run_generation || status=$?

  printf '\n\n'
  if ((status == 0)); then
    printf '%s\n' "$BANNER_RULE" "Test complete!" "$BANNER_RULE"
  else
    # Failure report goes to stderr so it is not mistaken for model output.
    printf '%s\n' \
      "$BANNER_RULE" \
      "Test FAILED (shimmy exit code ${status})" \
      "$BANNER_RULE" >&2
  fi

  return "$status"
}

# Last command of the script: its return value becomes the exit status.
main "$@"