@@ -1,6 +1,6 @@
lang: cURL
source: |-
# OpenAI provider - Chat Completions
# OpenAI provider — endpoint required (/v1/responses or /v1/chat/completions)
curl -sS -X POST "https://inference.do-ai.run/v1/batches" \
-H "Authorization: Bearer $DIGITALOCEAN_TOKEN" \
-H "Content-Type: application/json" \
@@ -12,14 +12,13 @@ source: |-
"request_id": "c7e3ad1e-20c3-4e47-9bf2-6f2a4d6a2f11"
}'

# Anthropic provider - Messages
# Anthropic provider — DO NOT send endpoint
curl -sS -X POST "https://inference.do-ai.run/v1/batches" \
-H "Authorization: Bearer $DIGITALOCEAN_TOKEN" \
-H "Content-Type: application/json" \
-d '{
"file_id": "a1b2c3d4-e5f6-4789-90ab-cdef12345678",
"provider": "anthropic",
"endpoint": "/v1/messages",
"completion_window": "24h",
"request_id": "2f1a7d9e-8c03-4d2c-9b7e-6f8e2b1a4c77"
}'
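The two curl calls above encode a provider-specific rule: OpenAI batches must name an endpoint (`/v1/responses` or `/v1/chat/completions`), while Anthropic batches must omit `endpoint` entirely. A minimal client-side pre-flight check, sketched under the assumption that the required fields are exactly those shown in the request examples:

```python
# Hypothetical pre-flight validation mirroring the provider rules above.
# Field names are taken from the curl payloads; this is a sketch, not
# part of the spec.
OPENAI_ENDPOINTS = {"/v1/responses", "/v1/chat/completions"}


def validate_batch_payload(payload: dict) -> list[str]:
    """Return a list of problems; an empty list means the payload looks sendable."""
    problems = []
    provider = payload.get("provider")
    endpoint = payload.get("endpoint")
    if provider == "openai":
        if endpoint not in OPENAI_ENDPOINTS:
            problems.append(
                "openai requires endpoint /v1/responses or /v1/chat/completions"
            )
    elif provider == "anthropic":
        if endpoint is not None:
            problems.append("anthropic batches must not include endpoint")
    else:
        problems.append(f"unknown provider: {provider!r}")
    # Required in every request per the examples above.
    for field in ("file_id", "completion_window", "request_id"):
        if not payload.get(field):
            problems.append(f"missing required field: {field}")
    return problems
```

Running this before POSTing surfaces the 400-class mistakes (wrong endpoint for the provider, missing idempotency key) without burning a request.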
@@ -2,6 +2,12 @@ lang: cURL
source: |-
# UPLOAD_URL is the exact upload_url returned by POST /v1/batches/files.
# Use it verbatim; do not modify the host, path, or query string.
#
# Send the raw JSONL bytes with --data-binary so line endings and UTF-8
# are preserved. The presigned URL is signature-sensitive: prefer
# application/octet-stream (or omit Content-Type entirely) — a custom
# value such as application/jsonl can break signature matching unless
# the URL was signed for that exact header.
curl -X PUT "$UPLOAD_URL" \
-H "Content-Type: application/jsonl" \
--data-binary "@eval_prompts_v1.jsonl"
-H "Content-Type: application/octet-stream" \
--data-binary "@batch_requests.jsonl"
@@ -0,0 +1,13 @@
lang: JavaScript
source: |-

Two issues.

result.id → result.batch_id.
result.cancel_requested_at doesn't exist; use cancelled_at or just print status.

import { InferenceClient } from "@digitalocean/dots";

const client = new InferenceClient({
apiKey: process.env.DIGITALOCEAN_TOKEN,
});

const result = await client.batches.cancel(process.env.BATCH_ID);

console.log("batch_id: ", result.batch_id);
console.log("status: ", result.status);
console.log("cancelled_at:", result.cancelled_at);
@@ -0,0 +1,19 @@
lang: JavaScript
source: |-
import { randomUUID } from "node:crypto";
import { InferenceClient } from "@digitalocean/dots";

const client = new InferenceClient({
apiKey: process.env.DIGITALOCEAN_TOKEN,
});

const batch = await client.batches.create({
file_id: process.env.BATCH_INPUT_FILE_ID,
provider: "openai",
endpoint: "/v1/chat/completions",
completion_window: "24h",
request_id: randomUUID(),
});

console.log("batch_id:", batch.batch_id);
console.log("status: ", batch.status);
@@ -0,0 +1,14 @@
lang: JavaScript

Looks right against batch_file_create_response.yml. One nit: client.files.create(...) reads like OpenAI-Files; if the SDK actually exposes this as client.batches.files.create(...) (the URL is /v1/batches/files), prefer that name for clarity.

source: |-
import { InferenceClient } from "@digitalocean/dots";

const client = new InferenceClient({
apiKey: process.env.DIGITALOCEAN_TOKEN,
});

const intent = await client.files.create({
file_name: "batch_requests.jsonl",
});

console.log("file_id: ", intent.file_id);
console.log("upload_url:", intent.upload_url);
@@ -0,0 +1,14 @@
lang: JavaScript
source: |-
import { InferenceClient } from "@digitalocean/dots";

const client = new InferenceClient({
apiKey: process.env.DIGITALOCEAN_TOKEN,
});

const batch = await client.batches.retrieve(process.env.BATCH_ID);

console.log("batch_id: ", batch.batch_id);
console.log("status: ", batch.status);
console.log("request_counts:", batch.request_counts);
console.log("output_file_id:", batch.output_file_id);
@@ -0,0 +1,22 @@
lang: JavaScript
source: |-
import { InferenceClient } from "@digitalocean/dots";

const client = new InferenceClient({
apiKey: process.env.DIGITALOCEAN_TOKEN,
});

const batchId = process.env.BATCH_ID;

// client.files.content resolves the result envelope and follows the
// presigned URL for you, returning the raw fetch Response.
const resp = await client.files.content(batchId);

Likely wrong API call. client.files.content(batchId) passes a batch id to a files helper. The endpoint GET /v1/batches/{batch_id}/results returns presigned URLs in batch_results_response.yml; you then fetch(output_file_url). Should be:
const links = await client.batches.results.retrieve(batchId);
if (!links.result_available) { console.log("not ready"); return; }
const resp = await fetch(links.output_file_url);

if (!resp.ok) {
throw new Error(`results not ready: HTTP ${resp.status}`);
}

const body = await resp.text();
const lines = body.split("\n").filter(Boolean);

console.log(`got ${lines.length} line(s); first entry:`);
console.log(lines[0]);
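The downloaded body is JSONL: one result object per line, each carrying the `custom_id` from the corresponding input request. A sketch of indexing the output by `custom_id` (the `custom_id` key is taken from the request objects in the upload examples; the rest of the line shape is assumed):

```python
import json


def index_results_by_custom_id(jsonl_text: str) -> dict:
    """Parse batch output JSONL into {custom_id: result object}.

    Assumes each line is a JSON object with a custom_id key, matching the
    request lines shown in the upload examples. Blank lines and lines
    without a custom_id are skipped rather than treated as fatal.
    """
    results = {}
    for line in jsonl_text.splitlines():
        line = line.strip()
        if not line:
            continue
        obj = json.loads(line)
        custom_id = obj.get("custom_id")
        if custom_id is not None:
            results[custom_id] = obj
    return results
```

Indexing this way lets callers join results back to their own records regardless of the order the provider returned them in.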
@@ -0,0 +1,16 @@
lang: JavaScript

Blocker — wrong pagination shape. Uses page.edges.map(e => e.node) (Relay-style), but batch_list_response.yml is { object, data, has_more, first_id, last_id }. Should be:

for (const b of page.data ?? []) {
console.log(`${b.batch_id}\t${b.status}\t${b.created_at}`);
}
console.log("has_more:", page.has_more, "last_id:", page.last_id);

source: |-
import { InferenceClient } from "@digitalocean/dots";

const client = new InferenceClient({
apiKey: process.env.DIGITALOCEAN_TOKEN,
});

const page = await client.batches.list({ limit: 20 });

for (const b of page.data ?? []) {
console.log(`${b.batch_id}\t${b.status}\t${b.created_at}`);
}

console.log("has_more:", page.has_more);
console.log("last_id: ", page.last_id);
@@ -0,0 +1,32 @@
lang: JavaScript

Combines step 1 (reserve intent) and step 2 (PUT bytes) into one snippet. That's fine but it duplicates create_batch_file. Consider trimming step 1 here so each example documents one endpoint, matching the curl pair.

source: |-
// Two-step upload flow:
// 1. Reserve a file_id + presigned upload_url via client.files.create.
// 2. PUT the raw JSONL bytes to upload_url.
//
// The presigned URL is short-lived (~15 minutes) and signature-sensitive —
// use it verbatim and prefer Content-Type application/octet-stream (or
// omit the header entirely). A custom value such as application/jsonl
// can break signature matching.
import { readFile } from "node:fs/promises";
import { InferenceClient } from "@digitalocean/dots";

const client = new InferenceClient({
apiKey: process.env.DIGITALOCEAN_TOKEN,
});

// Step 1: reserve the upload slot.
const intent = await client.files.create({ file_name: "batch_requests.jsonl" });

// Step 2: PUT the JSONL bytes to the presigned URL.
const body = await readFile("batch_requests.jsonl");
const res = await fetch(intent.upload_url, {
method: "PUT",
headers: { "Content-Type": "application/octet-stream" },
body,
});
if (!res.ok) {
throw new Error(`Upload failed: HTTP ${res.status} ${res.statusText}`);
}

console.log("uploaded file_id:", intent.file_id);
@@ -0,0 +1,13 @@
lang: Python

Two blockers.

result.get("id") → result.get("batch_id").
result.get("cancel_requested_at") doesn't exist on batch.yml. Use cancelled_at (or print status only — the cancel response is the full batch and the user mostly cares that status is cancelling / cancelled).

source: |-
import os

from pydo import Client

client = Client(token=os.environ.get("DIGITALOCEAN_TOKEN"))

result = client.batches.cancel(os.environ["BATCH_ID"])

print("batch_id: ", result.get("batch_id"))
print("status: ", result.get("status"))
print("cancelled_at:", result.get("cancelled_at"))
@@ -0,0 +1,19 @@
lang: Python

Blocker — request body doesn't match batch_create_request.yml.

input_file_id= should be file_id= (line 8 of the example).
Missing required provider (e.g. "openai").
Missing required request_id — it's the idempotency key. Add import uuid and pass request_id=str(uuid.uuid4()).
Suggested:

batch = client.batches.create(
    body={
        "file_id": os.environ["BATCH_INPUT_FILE_ID"],
        "provider": "openai",
        "endpoint": "/v1/chat/completions",
        "completion_window": "24h",
        "request_id": str(uuid.uuid4()),
    }
)

print("batch_id:", batch.get("batch_id"))

Also batch.get("id") → batch.get("batch_id") per batch.yml:12.

source: |-
import os
import uuid

from pydo import Client

client = Client(token=os.environ.get("DIGITALOCEAN_TOKEN"))

batch = client.batches.create(
file_id=os.environ["BATCH_INPUT_FILE_ID"],
provider="openai",
endpoint="/v1/chat/completions",
completion_window="24h",
request_id=str(uuid.uuid4()),
)

print("batch_id:", batch.get("batch_id"))
print("status: ", batch.get("status"))
@@ -0,0 +1,44 @@
lang: Python

Blocker — wrong endpoint and wrong response shape.
The spec endpoint is POST /v1/batches/files, which returns { file_id, upload_url, expires_at } per batch_file_create_response.yml. The example instead calls client.files.create(file=input_path, purpose="batch") (OpenAI Files-style: send the bytes + a purpose) and reads uploaded.filename / uploaded.bytes — none of those exist on this response, and purpose isn't on the request schema.

Mirror the dots version: call the batch-files create method with file_name=... and print file_id / upload_url. The actual JSONL bytes belong in inference_upload_batch_file.yml, not here.

source: |-
import json
import os
from pathlib import Path

from pydo import Client

client = Client(token=os.environ.get("DIGITALOCEAN_TOKEN"))

input_path = Path("batch_requests.jsonl")
requests = [
{
"custom_id": "q-1",
"method": "POST",
"url": "/v1/chat/completions",
"body": {
"model": "llama3.3-70b-instruct",
"messages": [
{"role": "user", "content": "One fun fact about octopuses."}
],
"max_tokens": 128,
},
},
{
"custom_id": "q-2",
"method": "POST",
"url": "/v1/chat/completions",
"body": {
"model": "llama3.3-70b-instruct",
"messages": [
{"role": "user", "content": "One fun fact about sharks."}
],
"max_tokens": 128,
},
},
]
input_path.write_text("\n".join(json.dumps(r) for r in requests) + "\n")

uploaded = client.files.create(file=input_path, purpose="batch")

print("file_id: ", uploaded.file_id)
print("filename:", uploaded.filename)
print("bytes: ", uploaded.bytes)
@@ -0,0 +1,14 @@
lang: Python
source: |-
import os

from pydo import Client

client = Client(token=os.environ.get("DIGITALOCEAN_TOKEN"))

batch = client.batches.retrieve(os.environ["BATCH_ID"])


Blocker — batch.get("id") is always None. Per batch.yml, the field is batch_id. Change to batch.get("batch_id").

print("batch_id: ", batch.get("batch_id"))
print("status: ", batch.get("status"))
print("request_counts:", batch.get("request_counts"))
print("output_file_id:", batch.get("output_file_id"))
@@ -0,0 +1,27 @@
lang: Python

Blocker — wrong field name. Line reads links["output_file_id"], but batch_results_response.yml returns output_file_url (a short-lived presigned URL). The endpoint does not return an output file ID.

The follow-up client.files.content(...) call also doesn't compose: you GET the presigned URL with requests.get, you don't pass it through the SDK. Rewrite as:

import requests
links = client.batches.results.retrieve(batch_id)
if not links.get("result_available"):
print("results not ready yet"); raise SystemExit(0)
resp = requests.get(links["output_file_url"], timeout=60)
resp.raise_for_status()
Path("batch_output.jsonl").write_bytes(resp.content)

source: |-
import os
from pathlib import Path

import requests
from pydo import Client

client = Client(token=os.environ.get("DIGITALOCEAN_TOKEN"))

batch_id = os.environ["BATCH_ID"]

links = client.batches.results.retrieve(batch_id)

if not links.get("result_available"):
print("results not ready yet; poll batch status and retry")
raise SystemExit(0)

resp = requests.get(links["output_file_url"], timeout=60)
resp.raise_for_status()

out = Path("batch_output.jsonl")
out.write_bytes(resp.content)

print("wrote:", out)
print("----- preview -----")
print(resp.text[:500])
@@ -0,0 +1,15 @@
lang: Python
source: |-
import os

from pydo import Client

client = Client(token=os.environ.get("DIGITALOCEAN_TOKEN"))

resp = client.batches.list(limit=20)

for b in resp.get("data") or []:
print(f"{b.get('batch_id'):40} {b.get('status'):12} {b.get('created_at')}")

print("has_more:", resp.get("has_more"))
print("last_id: ", resp.get("last_id"))
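The list response exposes `has_more` and `last_id`, which is enough to drive cursor pagination. A sketch of walking every page; note the cursor parameter name (`after`) is an assumption for illustration, not something the examples here confirm, so check the spec for the real query parameter:

```python
# Cursor-pagination sketch over the {data, has_more, last_id} page shape
# shown above. list_page is any callable returning one page dict; the
# `after` keyword is a hypothetical cursor name for illustration only.
def iter_all_batches(list_page):
    """Yield every batch across pages until has_more is false."""
    after = None
    while True:
        page = list_page(after=after)
        yield from page.get("data") or []
        if not page.get("has_more"):
            return
        after = page.get("last_id")
```

Injecting the page-fetching callable keeps the loop testable without a live client.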
@@ -0,0 +1,36 @@
lang: Python

Misleading lead comment. Lines 1–4 claim client.files.create() "performs both steps for you, prefer it" — that contradicts your create_batch_file example, which only reserves the intent. Drop the comment or rewrite it to say "step 1 reserves file_id+upload_url (see create_batch_file); this example PUTs the bytes."

PUT logic itself looks fine. Minor: avoid printing upload_url-derived state.

source: |-
# Two-step upload flow:
# 1. Reserve a file_id + presigned upload_url via client.batches.files.create.
# 2. PUT the raw JSONL bytes to upload_url.
#
# The presigned URL is short-lived (~15 minutes) and signature-sensitive —
# use it verbatim and prefer Content-Type application/octet-stream (or
# omit the header entirely). A custom value such as application/jsonl
# can break signature matching.
import os
from pathlib import Path

import requests
from pydo import Client

client = Client(token=os.environ.get("DIGITALOCEAN_TOKEN"))

input_path = Path("batch_requests.jsonl")

# Step 1: reserve the upload slot.
intent = client.batches.files.create(file_name=input_path.name)
upload_url = intent["upload_url"]
file_id = intent["file_id"]

# Step 2: PUT the JSONL bytes to the presigned URL.
with input_path.open("rb") as fh:
put = requests.put(
upload_url,
data=fh,
headers={"Content-Type": "application/octet-stream"},
timeout=60,
)
put.raise_for_status()

print("uploaded file_id:", file_id)
7 changes: 6 additions & 1 deletion specification/resources/inference/inference_cancel_batch.yml
@@ -4,7 +4,10 @@ description: >
Requests cancellation of a batch job. The job transitions to `cancelling`
and, once in-flight requests drain, to `cancelled`. Jobs already in a
terminal state (`completed`, `failed`, `expired`, `cancelled`) cannot be
cancelled and return `409 Conflict`.
cancelled and return `409 Conflict`. Cancellation is also rejected with
`409 Conflict` while the job has not yet been submitted to the upstream
provider — there is nothing to cancel until the provider batch id is
assigned.


Partial results produced before cancellation remain available via
@@ -54,5 +57,7 @@ responses:
$ref: '../../shared/responses/unexpected_error.yml'
x-codeSamples:
- $ref: 'examples/curl/inference_cancel_batch.yml'
- $ref: 'examples/python/inference_cancel_batch.yml'
- $ref: 'examples/dots/inference_cancel_batch.yml'
security:
- inference_bearer_auth: []
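The description above gives cancellation two benign 409 cases (already terminal, or not yet submitted upstream), so callers can treat 409 Conflict as a no-op. A defensive wrapper sketch; reading `status_code` off the raised error is an assumption about the SDK's exception shape, so adjust for the real client:

```python
def cancel_batch_safely(client, batch_id):
    """Request cancellation, treating 409 Conflict as a benign no-op.

    Per the endpoint description, 409 means the job is already in a
    terminal state (completed/failed/expired/cancelled) or has not yet
    been submitted to the upstream provider. The status_code attribute
    checked here is a hypothetical stand-in for the SDK's error type.
    """
    try:
        return client.batches.cancel(batch_id)
    except Exception as exc:
        if getattr(exc, "status_code", None) == 409:
            return None  # nothing to cancel; not an error for the caller
        raise
```

Returning `None` on 409 lets polling loops and shutdown hooks call cancel unconditionally without special-casing job state first.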
7 changes: 4 additions & 3 deletions specification/resources/inference/inference_create_batch.yml
@@ -29,18 +29,17 @@ requestBody:
endpoint: "/v1/chat/completions"
completion_window: "24h"
request_id: "c7e3ad1e-20c3-4e47-9bf2-6f2a4d6a2f11"
OpenAI Embeddings:
OpenAI Responses:
value:
file_id: "a1b2c3d4-e5f6-4789-90ab-cdef12345678"
provider: "openai"
endpoint: "/v1/embeddings"
endpoint: "/v1/responses"
completion_window: "24h"
request_id: "9f7b9d4a-4e6c-4a27-8e35-1b0e4c5a9a12"
Anthropic Messages:
value:
file_id: "a1b2c3d4-e5f6-4789-90ab-cdef12345678"
provider: "anthropic"
endpoint: "/v1/messages"
completion_window: "24h"
request_id: "2f1a7d9e-8c03-4d2c-9b7e-6f8e2b1a4c77"
metadata:
@@ -80,5 +79,7 @@ responses:
$ref: '../../shared/responses/unexpected_error.yml'
x-codeSamples:
- $ref: 'examples/curl/inference_create_batch.yml'
- $ref: 'examples/python/inference_create_batch.yml'
- $ref: 'examples/dots/inference_create_batch.yml'
security:
- inference_bearer_auth: []