Streaming
curl -N -X POST https://api.moondream.ai/v1/query \
-H 'Content-Type: application/json' \
-H 'X-Moondream-Auth: YOUR_API_KEY' \
-d '{
"image_url": "",
"question": "What is in this image?",
"stream": true
}'
data: {"text": "The"}
data: {"text": " image"}
▊Streaming lets you receive AI responses as they're being generated, word-by-word, instead of waiting for the complete answer. This creates a more responsive experience for your users. Streaming is available for the query and caption endpoints.
Using with the SDK
- Python
- Node.js
View Python SDK Documentation →
Query
import moondream as md
from PIL import Image
# Initialize with your API key
model = md.vl(api_key="YOUR_API_KEY")
# Load an image
image = Image.open("path/to/image.jpg")
# Stream a query response
for chunk in model.query(image, question="What is in this image?", stream=True)["answer"]:
print(chunk, end="", flush=True)
Caption
import moondream as md
from PIL import Image
# Initialize with your API key
model = md.vl(api_key="YOUR_API_KEY")
# Load an image
image = Image.open("path/to/image.jpg")
# Stream a caption
for chunk in model.caption(image, stream=True)["caption"]:
print(chunk, end="", flush=True)
View Node.js SDK Documentation →
Query
import { vl } from 'moondream';
import fs from 'fs';
// Initialize with your API key
const model = new vl({ apiKey: 'YOUR_API_KEY' });
// Load an image
const image = fs.readFileSync('path/to/image.jpg');
// Stream a query response
const stream = await model.query({
image: image,
question: 'What is in this image?',
stream: true
});
for await (const chunk of stream.answer) {
process.stdout.write(chunk);
}
Caption
import { vl } from 'moondream';
import fs from 'fs';
// Initialize with your API key
const model = new vl({ apiKey: 'YOUR_API_KEY' });
// Load an image
const image = fs.readFileSync('path/to/image.jpg');
// Stream a caption
const stream = await model.caption({
image: image,
length: 'normal',
stream: true
});
for await (const chunk of stream.caption) {
process.stdout.write(chunk);
}