Gemini Media Recognition

Generate content (Gemini)

curl --request POST \
  --url https://api.dgrid.ai/v1/models/{model}:generateContent \
  --header 'Authorization: Bearer <token>' \
  --header 'Content-Type: application/json' \
  --data '
{
  "contents": [
    {
      "role": "user",
      "parts": [
        {
          "text": "Hello from DGrid."
        }
      ]
    }
  ]
}
'

import requests

# generateContent endpoint; replace {model} with the target model ID.
url = "https://api.dgrid.ai/v1/models/{model}:generateContent"

# A single user turn containing one plain-text part.
payload = { "contents": [
        {
            "role": "user",
            "parts": [{ "text": "Hello from DGrid." }]
        }
    ] }
# Replace <token> with your DGrid API key.
headers = {
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json"
}

# requests applies no timeout by default, so an unresponsive server would
# block this call forever; bound the wait explicitly.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw body; error responses are also returned as JSON text.
print(response.text)

// Request configuration: bearer-token auth and a JSON body holding a single
// user turn with one plain-text part. Replace <token> with your API key.
const options = {
  method: 'POST',
  headers: {
    Authorization: 'Bearer <token>',
    'Content-Type': 'application/json',
  },
  body: JSON.stringify({
    contents: [
      {
        role: 'user',
        parts: [{text: 'Hello from DGrid.'}],
      },
    ],
  }),
};

// Send the request, log the parsed JSON response, and log any failure
// (network error or invalid JSON) to the error console.
(async () => {
  try {
    const res = await fetch('https://api.dgrid.ai/v1/models/{model}:generateContent', options);
    const data = await res.json();
    console.log(data);
  } catch (err) {
    console.error(err);
  }
})();

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends a sample generateContent request to the DGrid Gemini endpoint
// and prints the raw response body to standard output.
//
// Replace the {model} placeholder in the URL and the <token> placeholder in
// the Authorization header before running. Each step that can fail is
// checked; on failure the error is printed and the program returns early
// instead of continuing with a nil request or response.
func main() {

	url := "https://api.dgrid.ai/v1/models/{model}:generateContent"

	payload := strings.NewReader("{\n  \"contents\": [\n    {\n      \"role\": \"user\",\n      \"parts\": [\n        {\n          \"text\": \"Hello from DGrid.\"\n        }\n      ]\n    }\n  ]\n}")

	req, err := http.NewRequest(http.MethodPost, url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Authorization", "Bearer <token>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do fails, so the body must not be touched here.
		fmt.Println("sending request:", err)
		return
	}
	// Only defer the close once res is known to be non-nil.
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	// Surface non-2xx statuses; the body printed below then carries the
	// JSON error object returned by the API.
	if res.StatusCode < 200 || res.StatusCode > 299 {
		fmt.Println("unexpected status:", res.Status)
	}

	fmt.Println(string(body))

}

HttpResponse<String> response = Unirest.post("https://api.dgrid.ai/v1/models/{model}:generateContent")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body("{\n  \"contents\": [\n    {\n      \"role\": \"user\",\n      \"parts\": [\n        {\n          \"text\": \"Hello from DGrid.\"\n        }\n      ]\n    }\n  ]\n}")
  .asString();

{
  "candidates": [
    {
      "content": {
        "role": "<string>",
        "parts": [
          {}
        ]
      },
      "finishReason": "<string>",
      "safetyRatings": [
        {}
      ]
    }
  ],
  "usageMetadata": {
    "promptTokenCount": 123,
    "candidatesTokenCount": 123,
    "totalTokenCount": 123
  }
}

{
  "error": {
    "message": "<string>",
    "type": "<string>",
    "param": "<string>",
    "code": "<string>"
  }
}

POST

models

{model}

:generateContent

Generate content (Gemini)

curl --request POST \
  --url https://api.dgrid.ai/v1/models/{model}:generateContent \
  --header 'Authorization: Bearer <token>' \
  --header 'Content-Type: application/json' \
  --data '
{
  "contents": [
    {
      "role": "user",
      "parts": [
        {
          "text": "Hello from DGrid."
        }
      ]
    }
  ]
}
'

import requests

# generateContent endpoint; replace {model} with the target model ID.
url = "https://api.dgrid.ai/v1/models/{model}:generateContent"

# A single user turn containing one plain-text part.
payload = { "contents": [
        {
            "role": "user",
            "parts": [{ "text": "Hello from DGrid." }]
        }
    ] }
# Replace <token> with your DGrid API key.
headers = {
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json"
}

# requests applies no timeout by default, so an unresponsive server would
# block this call forever; bound the wait explicitly.
response = requests.post(url, json=payload, headers=headers, timeout=30)

# Print the raw body; error responses are also returned as JSON text.
print(response.text)

// Request configuration: bearer-token auth and a JSON body holding a single
// user turn with one plain-text part. Replace <token> with your API key.
const options = {
  method: 'POST',
  headers: {
    Authorization: 'Bearer <token>',
    'Content-Type': 'application/json',
  },
  body: JSON.stringify({
    contents: [
      {
        role: 'user',
        parts: [{text: 'Hello from DGrid.'}],
      },
    ],
  }),
};

// Send the request, log the parsed JSON response, and log any failure
// (network error or invalid JSON) to the error console.
(async () => {
  try {
    const res = await fetch('https://api.dgrid.ai/v1/models/{model}:generateContent', options);
    const data = await res.json();
    console.log(data);
  } catch (err) {
    console.error(err);
  }
})();

package main

import (
	"fmt"
	"strings"
	"net/http"
	"io"
)

// main sends a sample generateContent request to the DGrid Gemini endpoint
// and prints the raw response body to standard output.
//
// Replace the {model} placeholder in the URL and the <token> placeholder in
// the Authorization header before running. Each step that can fail is
// checked; on failure the error is printed and the program returns early
// instead of continuing with a nil request or response.
func main() {

	url := "https://api.dgrid.ai/v1/models/{model}:generateContent"

	payload := strings.NewReader("{\n  \"contents\": [\n    {\n      \"role\": \"user\",\n      \"parts\": [\n        {\n          \"text\": \"Hello from DGrid.\"\n        }\n      ]\n    }\n  ]\n}")

	req, err := http.NewRequest(http.MethodPost, url, payload)
	if err != nil {
		fmt.Println("building request:", err)
		return
	}

	req.Header.Add("Authorization", "Bearer <token>")
	req.Header.Add("Content-Type", "application/json")

	res, err := http.DefaultClient.Do(req)
	if err != nil {
		// res is nil when Do fails, so the body must not be touched here.
		fmt.Println("sending request:", err)
		return
	}
	// Only defer the close once res is known to be non-nil.
	defer res.Body.Close()

	body, err := io.ReadAll(res.Body)
	if err != nil {
		fmt.Println("reading response body:", err)
		return
	}

	// Surface non-2xx statuses; the body printed below then carries the
	// JSON error object returned by the API.
	if res.StatusCode < 200 || res.StatusCode > 299 {
		fmt.Println("unexpected status:", res.Status)
	}

	fmt.Println(string(body))

}

HttpResponse<String> response = Unirest.post("https://api.dgrid.ai/v1/models/{model}:generateContent")
  .header("Authorization", "Bearer <token>")
  .header("Content-Type", "application/json")
  .body("{\n  \"contents\": [\n    {\n      \"role\": \"user\",\n      \"parts\": [\n        {\n          \"text\": \"Hello from DGrid.\"\n        }\n      ]\n    }\n  ]\n}")
  .asString();

{
  "candidates": [
    {
      "content": {
        "role": "<string>",
        "parts": [
          {}
        ]
      },
      "finishReason": "<string>",
      "safetyRatings": [
        {}
      ]
    }
  ],
  "usageMetadata": {
    "promptTokenCount": 123,
    "candidatesTokenCount": 123,
    "totalTokenCount": 123
  }
}

{
  "error": {
    "message": "<string>",
    "type": "<string>",
    "param": "<string>",
    "code": "<string>"
  }
}

This page uses the same generateContent operation as Generate content (Gemini), with the playground above pre-filled for plain text chat. The notes below describe the Gemini-native multimodal fields you can add to contents[].parts to analyze images, audio, video, or mixed media in a single request.

Each part can carry inline data (base64-encoded bytes plus a MIME type) alongside text instructions, letting the model reason across modalities in one call.

Gemini-native request fields

The generic contents and generationConfig fields shown in the playground accept the following nested shape for multimodal recognition:

Field	Type	Required	Description
`contents[].role`	string	No	Role of the turn, e.g. `user`.
`contents[].parts`	array	Yes	Ordered list of content parts (text and/or inline media).
`contents[].parts[].text`	string	No	Text instruction or question for the model.
`contents[].parts[].inlineData`	object	No	Inline media payload for image, audio, or video understanding.
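`contents[].parts[].inlineData.mimeType`	string	No	MIME type of the inline data, e.g. `image/jpeg`, `audio/mp3`, `video/mp4`. Must be provided whenever `inlineData` is present.
`contents[].parts[].inlineData.data`	string	No	Base64-encoded media bytes. Must be provided whenever `inlineData` is present.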

You can mix multiple parts in a single turn — for example a text part with an instruction followed by one or more inlineData parts containing the media to analyze.

Example: analyzing an image

{
  "contents": [
    {
      "role": "user",
      "parts": [
        { "text": "Describe what is happening in this image." },
        {
          "inlineData": {
            "mimeType": "image/jpeg",
            "data": "<base64-encoded-image-bytes>"
          }
        }
      ]
    }
  ]
}

Response fields

The response follows the standard generateContent shape. The fields most relevant to media recognition are:

candidates

array

Candidate responses returned by the model.

Show candidate properties

candidates[].content

object

Generated content object.

Show content properties

candidates[].content.role

string

Role returned in the generated content block, typically model.

candidates[].content.parts

array

Returned content parts, typically text describing the analyzed media.

candidates[].finishReason

string

Finish reason string, e.g. STOP.

candidates[].safetyRatings

array

Safety evaluation results.

usageMetadata

object

Token accounting metadata, including promptTokenCount, candidatesTokenCount, and totalTokenCount. Inline media (images, audio, video) consumes prompt tokens in addition to any text parts.

Example response

200

{
  "candidates": [
    {
      "content": {
        "role": "model",
        "parts": [
          { "text": "The image shows a golden retriever sitting on a grassy lawn." }
        ]
      },
      "finishReason": "STOP",
      "safetyRatings": []
    }
  ],
  "usageMetadata": {
    "promptTokenCount": 264,
    "candidatesTokenCount": 18,
    "totalTokenCount": 282
  }
}

Authorizations

Authorization

string

header

required

Your DGrid API key. All endpoints use Authorization: Bearer <DGRID_API_KEY>.

Path Parameters

model

string

required

Target model ID, such as gemini-1.5-pro.

Body

application/json

contents

object[]

Input content array with role and parts.

Show child attributes

generationConfig

object

Generation configuration.

Show child attributes

Response

Generated content candidates.

candidates

object[]

Candidate responses returned by the model.

Show child attributes

usageMetadata

object

Token accounting metadata.

Show child attributes

Generate content (Gemini)

Create completion

GETTING STARTED

MODEL API

MANAGEMENT API KEYS

X402 API

Gemini Media Recognition

Gemini-native request fields

Example: analyzing an image

Response fields

Example response

Authorizations

Path Parameters

Body

Response

​Gemini-native request fields

​Example: analyzing an image

​Response fields

​Example response

Authorizations

Path Parameters

Body

Response

Gemini-native request fields

Example: analyzing an image

Response fields

Example response