1
0

test_book.sh 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561
  1. #!/usr/bin/env bash
  2. set -euo pipefail
  3. # =============================================================================
  4. # test_book.sh — LLM App Tutorial (Ch1–Ch5) E2E Test
  5. #
  6. # Code is extracted from the doc markdown files (<!-- test:full-code --> and
  7. # <!-- test:cmake --> markers), so tests always stay in sync with the docs.
  8. # =============================================================================
  9. SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)"
  10. PROJECT_ROOT="$(cd "$SCRIPT_DIR/../.." && pwd)"
  11. DOCS_DIR="$PROJECT_ROOT/docs-src/pages/ja/llm-app"
  12. WORKDIR=$(mktemp -d)
  13. MODEL_NAME="gemma-2-2b-it-Q4_K_M.gguf"
  14. MODEL_URL="https://huggingface.co/bartowski/gemma-2-2b-it-GGUF/resolve/main/${MODEL_NAME}"
  15. PORT=18080
  16. GECKODRIVER_PORT=4444
  17. SERVER_PID=""
  18. GECKODRIVER_PID=""
  19. PASS_COUNT=0
  20. FAIL_COUNT=0
  21. # ---------------------------------------------------------------------------
  22. # Cleanup
  23. # ---------------------------------------------------------------------------
  24. cleanup() {
  25. if [[ -n "$SERVER_PID" ]]; then
  26. kill "$SERVER_PID" 2>/dev/null || true
  27. wait "$SERVER_PID" 2>/dev/null || true
  28. fi
  29. if [[ -n "$GECKODRIVER_PID" ]]; then
  30. kill "$GECKODRIVER_PID" 2>/dev/null || true
  31. wait "$GECKODRIVER_PID" 2>/dev/null || true
  32. fi
  33. rm -rf "$WORKDIR"
  34. }
  35. trap cleanup EXIT
  36. # ---------------------------------------------------------------------------
  37. # Helpers
  38. # ---------------------------------------------------------------------------
  39. log() { echo "=== $*"; }
  40. pass() { echo " PASS: $*"; PASS_COUNT=$((PASS_COUNT + 1)); }
  41. fail() { echo " FAIL: $*"; FAIL_COUNT=$((FAIL_COUNT + 1)); }
  42. source "$SCRIPT_DIR/extract_code.sh"
  43. wait_for_server() {
  44. local max_wait=30
  45. local i=0
  46. while ! curl -s -o /dev/null "http://127.0.0.1:${PORT}/" 2>/dev/null; do
  47. sleep 1
  48. i=$((i + 1))
  49. if [[ $i -ge $max_wait ]]; then
  50. fail "Server did not start within ${max_wait}s"
  51. return 1
  52. fi
  53. done
  54. }
  55. stop_server() {
  56. if [[ -n "$SERVER_PID" ]]; then
  57. kill "$SERVER_PID" 2>/dev/null || true
  58. wait "$SERVER_PID" 2>/dev/null || true
  59. SERVER_PID=""
  60. fi
  61. }
  62. # Make an HTTP request and capture status + body
  63. # Usage: http_request METHOD PATH [DATA]
  64. # Sets: HTTP_STATUS, HTTP_BODY
  65. http_request() {
  66. local method="$1" path="$2" data="${3:-}"
  67. local tmp
  68. tmp=$(mktemp)
  69. if [[ -n "$data" ]]; then
  70. HTTP_STATUS=$(curl -s -o "$tmp" -w '%{http_code}' \
  71. -X "$method" "http://127.0.0.1:${PORT}${path}" \
  72. -H "Content-Type: application/json" \
  73. -d "$data")
  74. else
  75. HTTP_STATUS=$(curl -s -o "$tmp" -w '%{http_code}' \
  76. -X "$method" "http://127.0.0.1:${PORT}${path}")
  77. fi
  78. HTTP_BODY=$(cat "$tmp")
  79. rm -f "$tmp"
  80. }
  81. # Make an SSE request and capture the raw stream
  82. # Usage: http_sse PATH DATA
  83. # Sets: HTTP_STATUS, HTTP_BODY
  84. http_sse() {
  85. local path="$1" data="$2"
  86. HTTP_SSE_FILE=$(mktemp)
  87. HTTP_STATUS=$(curl -s -N -o "$HTTP_SSE_FILE" -w '%{http_code}' \
  88. -X POST "http://127.0.0.1:${PORT}${path}" \
  89. -H "Content-Type: application/json" \
  90. -d "$data")
  91. HTTP_BODY=$(cat "$HTTP_SSE_FILE")
  92. rm -f "$HTTP_SSE_FILE"
  93. }
  94. assert_status() {
  95. local expected="$1" label="$2"
  96. if [[ "$HTTP_STATUS" == "$expected" ]]; then
  97. pass "$label (status=$HTTP_STATUS)"
  98. else
  99. fail "$label (expected=$expected, got=$HTTP_STATUS)"
  100. echo " body: $HTTP_BODY"
  101. fi
  102. }
  103. assert_json_field() {
  104. local field="$1" label="$2"
  105. if echo "$HTTP_BODY" | python3 -c "import sys,json; d=json.load(sys.stdin); assert '$field' in d" 2>/dev/null; then
  106. pass "$label (field '$field' exists)"
  107. else
  108. fail "$label (field '$field' missing in response)"
  109. echo " body: $HTTP_BODY"
  110. fi
  111. }
  112. assert_json_value() {
  113. local field="$1" expected="$2" label="$3"
  114. local actual
  115. actual=$(echo "$HTTP_BODY" | python3 -c "import sys,json; print(json.load(sys.stdin)['$field'])" 2>/dev/null || echo "")
  116. if [[ "$actual" == "$expected" ]]; then
  117. pass "$label ($field='$actual')"
  118. else
  119. fail "$label (expected $field='$expected', got='$actual')"
  120. fi
  121. }
  122. assert_json_nonempty() {
  123. local field="$1" label="$2"
  124. local val
  125. val=$(echo "$HTTP_BODY" | python3 -c "import sys,json; v=json.load(sys.stdin)['$field']; assert len(str(v))>0; print(v)" 2>/dev/null || echo "")
  126. if [[ -n "$val" ]]; then
  127. pass "$label ($field is non-empty)"
  128. else
  129. fail "$label ($field is empty or missing)"
  130. echo " body: $HTTP_BODY"
  131. fi
  132. }
  133. # Patch port number in extracted source code (8080 -> test port)
  134. patch_port() {
  135. sed "s/127\.0\.0\.1\", 8080/127.0.0.1\", ${PORT}/g; s/127\.0\.0\.1:8080/127.0.0.1:${PORT}/g"
  136. }
  137. # Patch model path in extracted source code
  138. patch_model() {
  139. sed "s|models/gemma-2-2b-it-Q4_K_M.gguf|models/${MODEL_NAME}|g"
  140. }
  141. # =============================================================================
  142. # Ch1: Skeleton Server
  143. # =============================================================================
  144. test_ch1() {
  145. log "Ch1: Project Setup & Skeleton Server"
  146. local APP_DIR="$WORKDIR/translate-app"
  147. mkdir -p "$APP_DIR/src" "$APP_DIR/models"
  148. cd "$APP_DIR"
  149. # Copy httplib.h from project root (test current version)
  150. cp "$PROJECT_ROOT/httplib.h" .
  151. # Download json.hpp into nlohmann/ directory to match #include <nlohmann/json.hpp>
  152. mkdir -p nlohmann
  153. curl -sL -o nlohmann/json.hpp \
  154. https://github.com/nlohmann/json/releases/latest/download/json.hpp
  155. # CMakeLists.txt — ch1 doesn't need llama.cpp, so use a minimal version
  156. # (the doc's cmake includes llama.cpp which isn't cloned yet in ch1)
  157. cat > CMakeLists.txt << 'CMAKE_EOF'
  158. cmake_minimum_required(VERSION 3.16)
  159. project(translate-server LANGUAGES CXX)
  160. set(CMAKE_CXX_STANDARD 17)
  161. add_executable(translate-server src/main.cpp)
  162. target_include_directories(translate-server PRIVATE ${CMAKE_SOURCE_DIR})
  163. CMAKE_EOF
  164. # Extract main.cpp from ch1 doc and patch port
  165. extract_code "$DOCS_DIR/ch01-setup.md" "main.cpp" | patch_port > src/main.cpp
  166. # Build
  167. log "Ch1: Building..."
  168. cmake -B build -DCMAKE_BUILD_TYPE=Release 2>&1 | tail -1
  169. cmake --build build -j 2>&1 | tail -3
  170. # Start server
  171. ./build/translate-server &
  172. SERVER_PID=$!
  173. wait_for_server
  174. # Tests
  175. http_request POST /translate '{"text":"hello","target_lang":"ja"}'
  176. assert_status 200 "Ch1 POST /translate"
  177. assert_json_value translation "TODO" "Ch1 POST /translate returns TODO"
  178. http_request GET /models
  179. assert_status 200 "Ch1 GET /models"
  180. assert_json_field models "Ch1 GET /models"
  181. http_request POST /models/select '{"model":"test"}'
  182. assert_status 200 "Ch1 POST /models/select"
  183. assert_json_value status "TODO" "Ch1 POST /models/select returns TODO"
  184. stop_server
  185. log "Ch1: Done"
  186. }
  187. # =============================================================================
  188. # Ch2: REST API with llama.cpp
  189. # =============================================================================
  190. test_ch2() {
  191. log "Ch2: REST API with llama.cpp"
  192. local APP_DIR="$WORKDIR/translate-app"
  193. cd "$APP_DIR"
  194. # Clone llama.cpp
  195. if [[ ! -d llama.cpp ]]; then
  196. log "Ch2: Cloning llama.cpp..."
  197. git clone --depth 1 https://github.com/ggml-org/llama.cpp.git 2>&1 | tail -1
  198. fi
  199. # Download cpp-llamalib.h
  200. if [[ ! -f cpp-llamalib.h ]]; then
  201. curl -sL -o cpp-llamalib.h \
  202. https://raw.githubusercontent.com/yhirose/cpp-llamalib/main/cpp-llamalib.h
  203. fi
  204. # Download model
  205. if [[ ! -f "models/$MODEL_NAME" ]]; then
  206. log "Ch2: Downloading model ${MODEL_NAME} (~1.6GB)..."
  207. curl -L -o "models/$MODEL_NAME" "$MODEL_URL"
  208. fi
  209. # CMakeLists.txt from ch1 doc (includes llama.cpp)
  210. extract_code "$DOCS_DIR/ch01-setup.md" "CMakeLists.txt" > CMakeLists.txt
  211. # Extract main.cpp from ch2 doc and patch port + model path
  212. extract_code "$DOCS_DIR/ch02-rest-api.md" "main.cpp" | patch_port | patch_model > src/main.cpp
  213. # Build (clean rebuild needed — cmake config changed)
  214. log "Ch2: Building (this may take a while for llama.cpp)..."
  215. rm -rf build
  216. cmake -B build -DCMAKE_BUILD_TYPE=Release 2>&1 | tail -1
  217. cmake --build build -j 2>&1 | tail -3
  218. # Start server
  219. ./build/translate-server &
  220. SERVER_PID=$!
  221. wait_for_server
  222. # Tests — normal request
  223. http_request POST /translate \
  224. '{"text":"I had a great time visiting Tokyo last spring. The cherry blossoms were beautiful.","target_lang":"ja"}'
  225. assert_status 200 "Ch2 POST /translate normal"
  226. assert_json_nonempty translation "Ch2 POST /translate has translation"
  227. # Tests — invalid JSON
  228. http_request POST /translate 'not json'
  229. assert_status 400 "Ch2 POST /translate invalid JSON"
  230. # Tests — missing text
  231. http_request POST /translate '{"target_lang":"ja"}'
  232. assert_status 400 "Ch2 POST /translate missing text"
  233. # Tests — empty text
  234. http_request POST /translate '{"text":""}'
  235. assert_status 400 "Ch2 POST /translate empty text"
  236. stop_server
  237. log "Ch2: Done"
  238. }
  239. # =============================================================================
  240. # Ch3: SSE Streaming
  241. # =============================================================================
  242. test_ch3() {
  243. log "Ch3: SSE Streaming"
  244. local APP_DIR="$WORKDIR/translate-app"
  245. cd "$APP_DIR"
  246. # Extract main.cpp from ch3 doc and patch port + model path
  247. extract_code "$DOCS_DIR/ch03-sse-streaming.md" "main.cpp" | patch_port | patch_model > src/main.cpp
  248. # Build (incremental — only main.cpp changed)
  249. log "Ch3: Building..."
  250. cmake --build build -j 2>&1 | tail -3
  251. # Start server
  252. ./build/translate-server &
  253. SERVER_PID=$!
  254. wait_for_server
  255. # Tests — /translate still works
  256. http_request POST /translate \
  257. '{"text":"Hello world","target_lang":"ja"}'
  258. assert_status 200 "Ch3 POST /translate still works"
  259. # Tests — SSE streaming
  260. http_sse /translate/stream \
  261. '{"text":"I had a great time visiting Tokyo last spring. The cherry blossoms were beautiful.","target_lang":"ja"}'
  262. assert_status 200 "Ch3 POST /translate/stream status"
  263. # Check SSE format: has data: lines and ends with [DONE]
  264. local data_lines
  265. data_lines=$(echo "$HTTP_BODY" | grep -c '^data: ' || true)
  266. if [[ $data_lines -ge 2 ]]; then
  267. pass "Ch3 SSE has multiple data: lines ($data_lines)"
  268. else
  269. fail "Ch3 SSE expected multiple data: lines, got $data_lines"
  270. echo " body: $HTTP_BODY"
  271. fi
  272. if echo "$HTTP_BODY" | grep -q 'data: \[DONE\]'; then
  273. pass "Ch3 SSE ends with data: [DONE]"
  274. else
  275. fail "Ch3 SSE missing data: [DONE]"
  276. echo " body: $HTTP_BODY"
  277. fi
  278. # Tests — SSE invalid JSON
  279. http_sse /translate/stream 'not json'
  280. assert_status 400 "Ch3 POST /translate/stream invalid JSON"
  281. stop_server
  282. log "Ch3: Done"
  283. }
  284. # =============================================================================
  285. # Ch4: Model Management
  286. # =============================================================================
  287. test_ch4() {
  288. log "Ch4: Model Management"
  289. local APP_DIR="$WORKDIR/translate-app"
  290. cd "$APP_DIR"
  291. # Ch4+ uses ~/.translate-app/models/ — symlink model there
  292. local MODELS_HOME="$HOME/.translate-app/models"
  293. mkdir -p "$MODELS_HOME"
  294. ln -sf "$APP_DIR/models/$MODEL_NAME" "$MODELS_HOME/$MODEL_NAME"
  295. # CMakeLists.txt from ch4 (adds OpenSSL)
  296. extract_code "$DOCS_DIR/ch04-model-management.md" "CMakeLists.txt" > CMakeLists.txt
  297. # Extract main.cpp from ch4 doc
  298. extract_code "$DOCS_DIR/ch04-model-management.md" "main.cpp" | patch_port > src/main.cpp
  299. # Build (reconfigure for OpenSSL, incremental — reuses llama.cpp objects)
  300. log "Ch4: Building..."
  301. cmake -B build -DCMAKE_BUILD_TYPE=Release 2>&1 | tail -1
  302. cmake --build build -j 2>&1 | tail -3
  303. # Start server
  304. ./build/translate-server &
  305. SERVER_PID=$!
  306. wait_for_server
  307. # Tests — GET /models
  308. http_request GET /models
  309. assert_status 200 "Ch4 GET /models"
  310. assert_json_field models "Ch4 GET /models has models array"
  311. # デフォルトモデルがdownloaded+selectedであること
  312. local selected
  313. selected=$(echo "$HTTP_BODY" | python3 -c "
  314. import sys, json
  315. models = json.load(sys.stdin)['models']
  316. sel = [m for m in models if m['selected']]
  317. print(sel[0]['downloaded'] if sel else '')
  318. " 2>/dev/null || echo "")
  319. if [[ "$selected" == "True" ]]; then
  320. pass "Ch4 GET /models default model is downloaded and selected"
  321. else
  322. fail "Ch4 GET /models default model state unexpected"
  323. echo " body: $HTTP_BODY"
  324. fi
  325. # Tests — POST /models/select with already-downloaded model (SSE)
  326. http_sse /models/select '{"model": "gemma-2-2b-it"}'
  327. assert_status 200 "Ch4 POST /models/select already downloaded"
  328. if echo "$HTTP_BODY" | grep -q '"ready"'; then
  329. pass "Ch4 POST /models/select returns ready"
  330. else
  331. fail "Ch4 POST /models/select missing ready status"
  332. echo " body: $HTTP_BODY"
  333. fi
  334. # Tests — POST /models/select unknown model
  335. http_request POST /models/select '{"model": "nonexistent"}'
  336. assert_status 404 "Ch4 POST /models/select unknown model"
  337. # Tests — POST /models/select missing model field
  338. http_request POST /models/select '{"foo": "bar"}'
  339. assert_status 400 "Ch4 POST /models/select missing model field"
  340. # Tests — /translate still works after model select
  341. http_request POST /translate '{"text": "Hello", "target_lang": "ja"}'
  342. assert_status 200 "Ch4 POST /translate still works"
  343. assert_json_nonempty translation "Ch4 POST /translate has translation"
  344. # Tests — switch model via symlink (avoids downloading a second model)
  345. # Place a symlink so the server sees Llama-3.1-8B-Instruct as "downloaded"
  346. ln -sf "$MODELS_HOME/$MODEL_NAME" "$MODELS_HOME/Meta-Llama-3.1-8B-Instruct-Q4_K_M.gguf"
  347. http_sse /models/select '{"model": "Llama-3.1-8B-Instruct"}'
  348. assert_status 200 "Ch4 POST /models/select switch model"
  349. if echo "$HTTP_BODY" | grep -q '"ready"'; then
  350. pass "Ch4 model switch returns ready"
  351. else
  352. fail "Ch4 model switch missing ready"
  353. echo " body: $HTTP_BODY"
  354. fi
  355. # Translate with the switched model
  356. http_request POST /translate \
  357. '{"text": "The weather is nice today.", "target_lang": "ja"}'
  358. assert_status 200 "Ch4 POST /translate after model switch"
  359. assert_json_nonempty translation "Ch4 POST /translate switched model has translation"
  360. # Verify model list reflects the switch
  361. http_request GET /models
  362. local new_selected
  363. new_selected=$(echo "$HTTP_BODY" | python3 -c "
  364. import sys, json
  365. models = json.load(sys.stdin)['models']
  366. sel = [m for m in models if m['selected']]
  367. print(sel[0]['name'] if sel else '')
  368. " 2>/dev/null || echo "")
  369. if [[ "$new_selected" == "Llama-3.1-8B-Instruct" ]]; then
  370. pass "Ch4 GET /models reflects model switch"
  371. else
  372. fail "Ch4 GET /models expected Llama-3.1-8B-Instruct selected, got '$new_selected'"
  373. fi
  374. stop_server
  375. log "Ch4: Done"
  376. }
  377. # =============================================================================
  378. # Ch5: Web UI (browser tests via geckodriver + webdriver.h)
  379. # =============================================================================
  380. start_geckodriver() {
  381. geckodriver --port "$GECKODRIVER_PORT" &>/dev/null &
  382. GECKODRIVER_PID=$!
  383. # Wait for geckodriver to be ready
  384. local i=0
  385. while ! curl -s -o /dev/null "http://127.0.0.1:${GECKODRIVER_PORT}/status" 2>/dev/null; do
  386. sleep 0.5
  387. i=$((i + 1))
  388. if [[ $i -ge 20 ]]; then
  389. fail "geckodriver did not start within 10s"
  390. return 1
  391. fi
  392. done
  393. }
  394. stop_geckodriver() {
  395. if [[ -n "$GECKODRIVER_PID" ]]; then
  396. kill "$GECKODRIVER_PID" 2>/dev/null || true
  397. wait "$GECKODRIVER_PID" 2>/dev/null || true
  398. GECKODRIVER_PID=""
  399. fi
  400. }
  401. test_ch5() {
  402. log "Ch5: Web UI (browser tests)"
  403. # Check for geckodriver
  404. if ! command -v geckodriver &>/dev/null; then
  405. log "Ch5: Skipping browser tests (geckodriver not found)"
  406. log "Ch5: Install with: brew install geckodriver"
  407. return 0
  408. fi
  409. local APP_DIR="$WORKDIR/translate-app"
  410. cd "$APP_DIR"
  411. # Extract source files from ch05
  412. extract_code "$DOCS_DIR/ch05-web-ui.md" "main.cpp" \
  413. | patch_port > src/main.cpp
  414. mkdir -p public
  415. extract_code "$DOCS_DIR/ch05-web-ui.md" "index.html" > public/index.html
  416. extract_code "$DOCS_DIR/ch05-web-ui.md" "style.css" > public/style.css
  417. extract_code "$DOCS_DIR/ch05-web-ui.md" "script.js" > public/script.js
  418. # Build (incremental — only main.cpp changed)
  419. log "Ch5: Building server..."
  420. cmake --build build -j 2>&1 | tail -3
  421. # Build browser test program
  422. log "Ch5: Building browser test..."
  423. g++ -std=c++17 \
  424. -I"$APP_DIR" \
  425. -I"$SCRIPT_DIR" \
  426. -o "$APP_DIR/build/test_webui" \
  427. "$SCRIPT_DIR/test_webui.cpp" \
  428. -pthread
  429. # Start server
  430. ./build/translate-server &
  431. SERVER_PID=$!
  432. wait_for_server
  433. # Start geckodriver
  434. start_geckodriver
  435. # Run browser tests
  436. log "Ch5: Running browser tests..."
  437. local test_exit=0
  438. "$APP_DIR/build/test_webui" "$PORT" || test_exit=$?
  439. # Parse pass/fail from test output and add to totals
  440. # (test_webui prints its own pass/fail, but we track via exit code)
  441. if [[ $test_exit -ne 0 ]]; then
  442. fail "Ch5 browser tests had failures"
  443. else
  444. pass "Ch5 browser tests all passed"
  445. fi
  446. stop_geckodriver
  447. stop_server
  448. log "Ch5: Done"
  449. }
  450. # =============================================================================
  451. # Main
  452. # =============================================================================
  453. log "LLM App Tutorial E2E Test"
  454. log "Working directory: $WORKDIR"
  455. echo ""
  456. test_ch1
  457. echo ""
  458. test_ch2
  459. echo ""
  460. test_ch3
  461. echo ""
  462. test_ch4
  463. echo ""
  464. test_ch5
  465. log "Results: $PASS_COUNT passed, $FAIL_COUNT failed"
  466. if [[ $FAIL_COUNT -gt 0 ]]; then
  467. exit 1
  468. fi