128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
|
# File 'lib/toy/serve/openai/handlers.rb', line 128
def handle(req, res)
res.["Content-Type"] = "text/html; charset=utf-8"
"<!doctype html><html><head><title>toy openai-compat (IDs only)</title></head>" +
"<body><h1>toy openai-compat API (ID-only)</h1>" +
"<p>Model: <code>" + STATE.model_name + "</code> via direct GGUF→FFI loader.</p>" +
"<p>Tokenize client-side; this server speaks integer token IDs only. " +
"Run <code>prep/qwen25_tokens.py encode \"...\"</code> to get IDs.</p>" +
"<p>Endpoints:</p><ul>" +
"<li><code>POST /v1/completions</code> — body <code>{\"prompt\":[int,...],\"max_tokens\":N}</code></li>" +
"<li><code>POST /v1/chat/completions</code> — 501 (tokenizer required)</li>" +
"<li><code>POST /v1/embeddings</code> — body <code>{\"input\":[int,...]}</code> → mean-pooled vector</li>" +
"<li><code>GET /v1/models</code></li>" +
"<li><code>GET /health</code></li>" +
"</ul></body></html>"
end
|