Skip to content

Commit 2cb6cf7

Browse files
committed
Use quantized base model
1 parent 19f20ec commit 2cb6cf7

File tree

3 files changed

+16
-8
lines changed

3 files changed

+16
-8
lines changed

.vscode/settings.json

Lines changed: 8 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,8 @@
1+
{
2+
"biome.configurationPath": "./auth/biome.json",
3+
"biome.enabled": true,
4+
"biome.lsp.bin": "./auth/node_modules/.bin/biome",
5+
"editor.codeActionsOnSave": {
6+
"source.fixAll.biome": "explicit"
7+
}
8+
}

auth/index.ts

Lines changed: 7 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,6 @@ import { env } from './env'
33
const SGLANG_URL = 'http://localhost:8000'
44

55
const server = Bun.serve({
6-
port: process.env.PORT || 3000,
76
async fetch(req) {
87
const url = new URL(req.url)
98

@@ -30,23 +29,24 @@ const server = Bun.serve({
3029

3130
// Forward to SGLang
3231
const response = await fetch(`${SGLANG_URL}${url.pathname}`, {
33-
method: req.method,
32+
body: req.method !== 'GET' ? await req.text() : null,
3433
headers: { 'content-type': 'application/json' },
35-
body: req.method !== 'GET' ? await req.text() : null
34+
method: req.method
3635
})
3736

3837
return new Response(response.body, {
39-
status: response.status,
40-
headers: response.headers
38+
headers: response.headers,
39+
status: response.status
4140
})
4241
} catch (error) {
4342
console.error(error)
4443
return Response.json(
45-
{ error: 'Internal Server Error', details: JSON.stringify(error) },
44+
{ details: JSON.stringify(error), error: 'Internal Server Error' },
4645
{ status: 500 }
4746
)
4847
}
49-
}
48+
},
49+
port: process.env.PORT || 3000
5050
})
5151

5252
console.log(`Auth server running on port ${server.port}`)

skypilot.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -6,7 +6,7 @@ num_nodes: 1
66
workdir: ./auth
77

88
envs:
9-
BASE_MODEL: Qwen/Qwen3-8B
9+
BASE_MODEL: Qwen/Qwen3-8B-AWQ
1010
HF_HUB_ENABLE_HF_TRANSFER: "1"
1111
CUDA_HOME: "/usr/local/cuda-12"
1212
LD_LIBRARY_PATH: "/usr/local/cuda-12/lib64:$LD_LIBRARY_PATH"

0 commit comments

Comments
 (0)