Gemini की Deep Research की सुविधा अब झलक के तौर पर उपलब्ध है. इसमें साथ मिलकर प्लान बनाने, विज़ुअलाइज़ेशन, एमसीपी के साथ काम करने की सुविधा वगैरह शामिल है.

Google uses AI technology to translate content into your preferred language. AI translations can contain errors.

Gemini की सोच-समझकर जवाब देने की क्षमता

Gemini 3 और 2.5 सीरीज़ के मॉडल, अंदरूनी "सोच-समझकर जवाब देने की प्रोसेस" का इस्तेमाल करते हैं. इससे, उनकी रीज़निंग और कई चरणों वाली प्लानिंग की क्षमता बेहतर होती है. इस वजह से, ये मॉडल कोडिंग, ऐडवांस लेवल की गणित, और डेटा विश्लेषण जैसे मुश्किल टास्क के लिए काफ़ी असरदार साबित होते हैं.

इस गाइड में, Gemini API का इस्तेमाल करके, Gemini की सोच-समझकर जवाब देने की क्षमता का इस्तेमाल करने का तरीका बताया गया है.

सोच-समझकर जवाब देने की क्षमता का इस्तेमाल करके कॉन्टेंट जनरेट करना

सोच-समझकर जवाब देने वाले मॉडल के साथ अनुरोध शुरू करना, कॉन्टेंट जनरेट करने के किसी अन्य अनुरोध की तरह ही होता है. मुख्य अंतर, model फ़ील्ड में सोच-समझकर जवाब देने की सुविधा वाले किसी मॉडल को तय करने की प्रोसेस में होता है. इसे, कॉन्टेंट जनरेट करने के इस उदाहरण में दिखाया गया है:

Python

from google import genai

client = genai.Client()
prompt = "Explain the concept of Occam's Razor and provide a simple, everyday example."
response = client.models.generate_content(
    model="gemini-3-flash-preview",
    contents=prompt
)

print(response.text)

JavaScript

import { GoogleGenAI } from "@google/genai";

const ai = new GoogleGenAI({});

async function main() {
  const prompt = "Explain the concept of Occam's Razor and provide a simple, everyday example.";

  const response = await ai.models.generateContent({
    model: "gemini-3-flash-preview",
    contents: prompt,
  });

  console.log(response.text);
}

main();

ऐप पर जाएं

package main

import (
  "context"
  "fmt"
  "log"
  "os"
  "google.golang.org/genai"
)

func main() {
  ctx := context.Background()
  client, err := genai.NewClient(ctx, nil)
  if err != nil {
      log.Fatal(err)
  }

  prompt := "Explain the concept of Occam's Razor and provide a simple, everyday example."
  model := "gemini-3-flash-preview"

  resp, _ := client.Models.GenerateContent(ctx, model, genai.Text(prompt), nil)

  fmt.Println(resp.Text())
}

REST

curl "https://generativelanguage.googleapis.com/v1beta/models/gemini-3-flash-preview:generateContent" \
 -H "x-goog-api-key: $GEMINI_API_KEY" \
 -H 'Content-Type: application/json' \
 -X POST \
 -d '{
   "contents": [
     {
       "parts": [
         {
           "text": "Explain the concept of Occam'\''s Razor and provide a simple, everyday example."
         }
       ]
     }
   ]
 }'
 ```

सोच-समझकर जवाब देने की प्रोसेस की खास जानकारी

सोच-समझकर जवाब देने की प्रोसेस की खास जानकारी, मॉडल की ओर से की गई रॉ थिंकिंग का संक्षिप्त वर्शन होती है. इससे, मॉडल की इंटरनल रीज़निंग प्रोसेस के बारे में अहम जानकारी मिलती है. ध्यान दें कि सोच-समझकर जवाब देने की प्रोसेस के लेवल और बजट, मॉडल की रॉ थिंकिंग पर लागू होते हैं. ये खास जानकारी पर लागू नहीं होते.

अनुरोध के कॉन्फ़िगरेशन में includeThoughts को true पर सेट करके, सोच-समझकर जवाब देने की प्रोसेस की खास जानकारी पाने की सुविधा चालू की जा सकती है. इसके बाद, response पैरामीटर के parts में जाकर, खास जानकारी ऐक्सेस की जा सकती है. साथ ही, thought बूलियन की जांच की जा सकती है.

यहां एक उदाहरण दिया गया है, जिसमें स्ट्रीमिंग के बिना, सोच-समझकर जवाब देने की प्रोसेस की खास जानकारी पाने की सुविधा चालू करने और उसे पाने का तरीका दिखाया गया है. इससे, जवाब के साथ, सोच-समझकर जवाब देने की प्रोसेस की एक खास जानकारी मिलती है:

Python

from google import genai
from google.genai import types

client = genai.Client()
prompt = "What is the sum of the first 50 prime numbers?"
response = client.models.generate_content(
  model="gemini-3-flash-preview",
  contents=prompt,
  config=types.GenerateContentConfig(
    thinking_config=types.ThinkingConfig(
      include_thoughts=True
    )
  )
)

for part in response.candidates[0].content.parts:
  if not part.text:
    continue
  if part.thought:
    print("Thought summary:")
    print(part.text)
    print()
  else:
    print("Answer:")
    print(part.text)
    print()

JavaScript

import { GoogleGenAI } from "@google/genai";

const ai = new GoogleGenAI({});

async function main() {
  const response = await ai.models.generateContent({
    model: "gemini-3-flash-preview",
    contents: "What is the sum of the first 50 prime numbers?",
    config: {
      thinkingConfig: {
        includeThoughts: true,
      },
    },
  });

  for (const part of response.candidates[0].content.parts) {
    if (!part.text) {
      continue;
    }
    else if (part.thought) {
      console.log("Thoughts summary:");
      console.log(part.text);
    }
    else {
      console.log("Answer:");
      console.log(part.text);
    }
  }
}

main();

ऐप पर जाएं

package main

import (
  "context"
  "fmt"
  "google.golang.org/genai"
  "os"
)

func main() {
  ctx := context.Background()
  client, err := genai.NewClient(ctx, nil)
  if err != nil {
      log.Fatal(err)
  }

  contents := genai.Text("What is the sum of the first 50 prime numbers?")
  model := "gemini-3-flash-preview"
  resp, _ := client.Models.GenerateContent(ctx, model, contents, &genai.GenerateContentConfig{
    ThinkingConfig: &genai.ThinkingConfig{
      IncludeThoughts: true,
    },
  })

  for _, part := range resp.Candidates[0].Content.Parts {
    if part.Text != "" {
      if part.Thought {
        fmt.Println("Thoughts Summary:")
        fmt.Println(part.Text)
      } else {
        fmt.Println("Answer:")
        fmt.Println(part.Text)
      }
    }
  }
}

यहां स्ट्रीमिंग के साथ सोच-समझकर जवाब देने की प्रोसेस का इस्तेमाल करने का एक उदाहरण दिया गया है. इससे, जनरेट होने के दौरान, खास जानकारी के रोलिंग और इन्क्रीमेंटल वर्शन मिलते हैं:

Python

from google import genai
from google.genai import types

client = genai.Client()

prompt = """
Alice, Bob, and Carol each live in a different house on the same street: red, green, and blue.
The person who lives in the red house owns a cat.
Bob does not live in the green house.
Carol owns a dog.
The green house is to the left of the red house.
Alice does not own a cat.
Who lives in each house, and what pet do they own?
"""

thoughts = ""
answer = ""

for chunk in client.models.generate_content_stream(
    model="gemini-3-flash-preview",
    contents=prompt,
    config=types.GenerateContentConfig(
      thinking_config=types.ThinkingConfig(
        include_thoughts=True
      )
    )
):
  for part in chunk.candidates[0].content.parts:
    if not part.text:
      continue
    elif part.thought:
      if not thoughts:
        print("Thoughts summary:")
      print(part.text)
      thoughts += part.text
    else:
      if not answer:
        print("Answer:")
      print(part.text)
      answer += part.text

JavaScript

import { GoogleGenAI } from "@google/genai";

const ai = new GoogleGenAI({});

const prompt = `Alice, Bob, and Carol each live in a different house on the same
street: red, green, and blue. The person who lives in the red house owns a cat.
Bob does not live in the green house. Carol owns a dog. The green house is to
the left of the red house. Alice does not own a cat. Who lives in each house,
and what pet do they own?`;

let thoughts = "";
let answer = "";

async function main() {
  const response = await ai.models.generateContentStream({
    model: "gemini-3-flash-preview",
    contents: prompt,
    config: {
      thinkingConfig: {
        includeThoughts: true,
      },
    },
  });

  for await (const chunk of response) {
    for (const part of chunk.candidates[0].content.parts) {
      if (!part.text) {
        continue;
      } else if (part.thought) {
        if (!thoughts) {
          console.log("Thoughts summary:");
        }
        console.log(part.text);
        thoughts = thoughts + part.text;
      } else {
        if (!answer) {
          console.log("Answer:");
        }
        console.log(part.text);
        answer = answer + part.text;
      }
    }
  }
}

await main();

ऐप पर जाएं

package main

import (
  "context"
  "fmt"
  "log"
  "os"
  "google.golang.org/genai"
)

const prompt = `
Alice, Bob, and Carol each live in a different house on the same street: red, green, and blue.
The person who lives in the red house owns a cat.
Bob does not live in the green house.
Carol owns a dog.
The green house is to the left of the red house.
Alice does not own a cat.
Who lives in each house, and what pet do they own?
`

func main() {
  ctx := context.Background()
  client, err := genai.NewClient(ctx, nil)
  if err != nil {
      log.Fatal(err)
  }

  contents := genai.Text(prompt)
  model := "gemini-3-flash-preview"

  resp := client.Models.GenerateContentStream(ctx, model, contents, &genai.GenerateContentConfig{
    ThinkingConfig: &genai.ThinkingConfig{
      IncludeThoughts: true,
    },
  })

  for chunk := range resp {
    for _, part := range chunk.Candidates[0].Content.Parts {
      if len(part.Text) == 0 {
        continue
      }

      if part.Thought {
        fmt.Printf("Thought: %s\n", part.Text)
      } else {
        fmt.Printf("Answer: %s\n", part.Text)
      }
    }
  }
}

सोच-समझकर जवाब देने की प्रोसेस को कंट्रोल करना

Gemini मॉडल, डिफ़ॉल्ट रूप से डाइनैमिक थिंकिंग में शामिल होते हैं. ये उपयोगकर्ता के अनुरोध की जटिलता के आधार पर, रीज़निंग के लिए ज़रूरी कोशिश को अपने-आप अडजस्ट करते हैं. हालांकि, अगर आपको खास लेटेंसी की पाबंदियां लागू करनी हैं या मॉडल से सामान्य से ज़्यादा गहराई से रीज़निंग करानी है, तो सोच-समझकर जवाब देने की प्रोसेस के व्यवहार को कंट्रोल करने के लिए, पैरामीटर का इस्तेमाल किया जा सकता है.

सोच-समझकर जवाब देने की प्रोसेस के लेवल (Gemini 3)

thinkingLevel पैरामीटर, Gemini 3 और इसके बाद के मॉडल के लिए इस्तेमाल करने का सुझाव दिया जाता है. इससे, रीज़निंग के व्यवहार को कंट्रोल किया जा सकता है.

यहां दी गई टेबल में, हर मॉडल टाइप के लिए thinkingLevel सेटिंग की जानकारी दी गई है:

सोच-समझकर जवाब देने की प्रोसेस का लेवल	Gemini 3.1 Pro	Gemini 3.1 Flash-Lite	Gemini 3 Flash	ब्यौरा
`minimal`	काम नहीं करता है	काम करता है (डिफ़ॉल्ट)	काम करता है	ज़्यादातर क्वेरी के लिए, "सोच-समझकर जवाब न देने" की सेटिंग से मेल खाता है. मुश्किल कोडिंग टास्क के लिए, मॉडल बहुत कम सोच-समझकर जवाब दे सकता है. चैट या ज़्यादा थ्रूपुट वाले ऐप्लिकेशन के लिए, लेटेंसी को कम करता है. ध्यान दें, `minimal` का मतलब यह नहीं है कि सोच-समझकर जवाब देने की प्रोसेस बंद है.
`low`	काम करता है	काम करता है	काम करता है	लेटेंसी और लागत को कम करता है. निर्देशों को आसानी से फ़ॉलो करने, चैट या ज़्यादा थ्रूपुट वाले ऐप्लिकेशन के लिए सबसे सही है.
`medium`	काम करता है	काम करता है	काम करता है	ज़्यादातर टास्क के लिए, सोच-समझकर जवाब देने की प्रोसेस का बैलेंस लेवल.
`high`	काम करता है (डिफ़ॉल्ट, डाइनैमिक)	काम करता है (डाइनैमिक)	काम करता है (डिफ़ॉल्ट, डाइनैमिक)	रीज़निंग की गहराई को बढ़ाता है. मॉडल को पहले (बिना सोच-समझकर जवाब देने वाले) आउटपुट टोकन तक पहुंचने में काफ़ी समय लग सकता है, लेकिन आउटपुट ज़्यादा सोच-समझकर दिया जाएगा.

यहां दिए गए उदाहरण में, सोच-समझकर जवाब देने की प्रोसेस का लेवल सेट करने का तरीका दिखाया गया है.

Python

from google import genai
from google.genai import types

client = genai.Client()

response = client.models.generate_content(
    model="gemini-3-flash-preview",
    contents="Provide a list of 3 famous physicists and their key contributions",
    config=types.GenerateContentConfig(
        thinking_config=types.ThinkingConfig(thinking_level="low")
    ),
)

print(response.text)

JavaScript

import { GoogleGenAI, ThinkingLevel } from "@google/genai";

const ai = new GoogleGenAI({});

async function main() {
  const response = await ai.models.generateContent({
    model: "gemini-3-flash-preview",
    contents: "Provide a list of 3 famous physicists and their key contributions",
    config: {
      thinkingConfig: {
        thinkingLevel: ThinkingLevel.LOW,
      },
    },
  });

  console.log(response.text);
}

main();

ऐप पर जाएं

package main

import (
  "context"
  "fmt"
  "google.golang.org/genai"
  "os"
)

func main() {
  ctx := context.Background()
  client, err := genai.NewClient(ctx, nil)
  if err != nil {
      log.Fatal(err)
  }

  thinkingLevelVal := "low"

  contents := genai.Text("Provide a list of 3 famous physicists and their key contributions")
  model := "gemini-3-flash-preview"
  resp, _ := client.Models.GenerateContent(ctx, model, contents, &genai.GenerateContentConfig{
    ThinkingConfig: &genai.ThinkingConfig{
      ThinkingLevel: &thinkingLevelVal,
    },
  })

fmt.Println(resp.Text())
}

REST

curl "https://generativelanguage.googleapis.com/v1beta/models/gemini-3-flash-preview:generateContent" \
-H "x-goog-api-key: $GEMINI_API_KEY" \
-H 'Content-Type: application/json' \
-X POST \
-d '{
  "contents": [
    {
      "parts": [
        {
          "text": "Provide a list of 3 famous physicists and their key contributions"
        }
      ]
    }
  ],
  "generationConfig": {
    "thinkingConfig": {
          "thinkingLevel": "low"
    }
  }
}'

Gemini 3.1 Pro के लिए, सोच-समझकर जवाब देने की प्रोसेस को बंद नहीं किया जा सकता. Gemini 3 Flash और Flash-Lite के लिए भी, सोच-समझकर जवाब देने की प्रोसेस को पूरी तरह से बंद नहीं किया जा सकता. हालांकि, minimal सेटिंग का मतलब है कि मॉडल शायद ही सोच-समझकर जवाब देगा (हालांकि, ऐसा हो सकता है). अगर सोच-समझकर जवाब देने की प्रोसेस का कोई लेवल तय नहीं किया जाता है, तो Gemini, Gemini 3 मॉडल के डिफ़ॉल्ट डाइनैमिक थिंकिंग लेवल, "high" का इस्तेमाल करेगा.

Gemini 2.5 सीरीज़ के मॉडल, thinkingLevel के साथ काम नहीं करते. इसके बजाय, thinkingBudget का इस्तेमाल करें.

सोच-समझकर जवाब देने की प्रोसेस के बजट

thinkingBudget पैरामीटर, Gemini 2.5 सीरीज़ के साथ लॉन्च किया गया था. यह मॉडल को रीज़निंग के लिए, सोच-समझकर जवाब देने वाले टोकन की तय संख्या का इस्तेमाल करने के बारे में बताता है.

यहां हर मॉडल टाइप के लिए, thinkingBudget के कॉन्फ़िगरेशन की जानकारी दी गई है. thinkingBudget को 0 पर सेट करके, सोच-समझकर जवाब देने की प्रोसेस को बंद किया जा सकता है. thinkingBudget को -1 पर सेट करने से, डाइनैमिक थिंकिंग चालू हो जाती है. इसका मतलब है कि मॉडल, अनुरोध की जटिलता के आधार पर बजट को अडजस्ट करेगा.

मॉडल	डिफ़ॉल्ट सेटिंग (सोच-समझकर जवाब देने की प्रोसेस का बजट सेट नहीं है)	रेंज	सोच-समझकर जवाब देने की प्रोसेस को बंद करना	डाइनैमिक थिंकिंग चालू करना
2.5 Pro	डाइनैमिक थिंकिंग	`128` से `32768`	लागू नहीं: सोच-समझकर जवाब देने की प्रोसेस को बंद नहीं किया जा सकता	`thinkingBudget = -1` (डिफ़ॉल्ट)
2.5 Flash	डाइनैमिक थिंकिंग	`0` से `24576`	`thinkingBudget = 0`	`thinkingBudget = -1` (डिफ़ॉल्ट)
2.5 Flash Preview	डाइनैमिक थिंकिंग	`0` से `24576`	`thinkingBudget = 0`	`thinkingBudget = -1` (डिफ़ॉल्ट)
2.5 Flash Lite	मॉडल सोच-समझकर जवाब नहीं देता	`512` से `24576`	`thinkingBudget = 0`	`thinkingBudget = -1`
2.5 Flash Lite Preview	मॉडल सोच-समझकर जवाब नहीं देता	`512` से `24576`	`thinkingBudget = 0`	`thinkingBudget = -1`
Robotics-ER 1.6 Preview	डाइनैमिक थिंकिंग	`0` से `24576`	`thinkingBudget = 0`	`thinkingBudget = -1` (डिफ़ॉल्ट)
2.5 Flash Live Native Audio Preview (09-2025)	डाइनैमिक थिंकिंग	`0` से `24576`	`thinkingBudget = 0`	`thinkingBudget = -1` (डिफ़ॉल्ट)

Python

from google import genai
from google.genai import types

client = genai.Client()

response = client.models.generate_content(
    model="gemini-2.5-flash",
    contents="Provide a list of 3 famous physicists and their key contributions",
    config=types.GenerateContentConfig(
        thinking_config=types.ThinkingConfig(thinking_budget=1024)
        # Turn off thinking:
        # thinking_config=types.ThinkingConfig(thinking_budget=0)
        # Turn on dynamic thinking:
        # thinking_config=types.ThinkingConfig(thinking_budget=-1)
    ),
)

print(response.text)

JavaScript

import { GoogleGenAI } from "@google/genai";

const ai = new GoogleGenAI({});

async function main() {
  const response = await ai.models.generateContent({
    model: "gemini-2.5-flash",
    contents: "Provide a list of 3 famous physicists and their key contributions",
    config: {
      thinkingConfig: {
        thinkingBudget: 1024,
        // Turn off thinking:
        // thinkingBudget: 0
        // Turn on dynamic thinking:
        // thinkingBudget: -1
      },
    },
  });

  console.log(response.text);
}

main();

ऐप पर जाएं

package main

import (
  "context"
  "fmt"
  "google.golang.org/genai"
  "os"
)

func main() {
  ctx := context.Background()
  client, err := genai.NewClient(ctx, nil)
  if err != nil {
      log.Fatal(err)
  }

  thinkingBudgetVal := int32(1024)

  contents := genai.Text("Provide a list of 3 famous physicists and their key contributions")
  model := "gemini-2.5-flash"
  resp, _ := client.Models.GenerateContent(ctx, model, contents, &genai.GenerateContentConfig{
    ThinkingConfig: &genai.ThinkingConfig{
      ThinkingBudget: &thinkingBudgetVal,
      // Turn off thinking:
      // ThinkingBudget: int32(0),
      // Turn on dynamic thinking:
      // ThinkingBudget: int32(-1),
    },
  })

fmt.Println(resp.Text())
}

REST

curl "https://generativelanguage.googleapis.com/v1beta/models/gemini-2.5-flash:generateContent" \
-H "x-goog-api-key: $GEMINI_API_KEY" \
-H 'Content-Type: application/json' \
-X POST \
-d '{
  "contents": [
    {
      "parts": [
        {
          "text": "Provide a list of 3 famous physicists and their key contributions"
        }
      ]
    }
  ],
  "generationConfig": {
    "thinkingConfig": {
          "thinkingBudget": 1024
    }
  }
}'

प्रॉम्प्ट के आधार पर, मॉडल टोकन बजट से ज़्यादा या कम टोकन का इस्तेमाल कर सकता है.

सोच-समझकर जवाब देने की प्रोसेस के सिग्नेचर

Gemini API, स्टेटलेस है. इसलिए, मॉडल हर एपीआई अनुरोध को अलग-अलग तरीके से प्रोसेस करता है. साथ ही, कई चरणों वाली बातचीत में, पिछले चरणों से मिले सोच-समझकर जवाब देने की प्रोसेस के कॉन्टेक्स्ट को ऐक्सेस नहीं कर पाता.

कई चरणों वाली बातचीत में, सोच-समझकर जवाब देने की प्रोसेस के कॉन्टेक्स्ट को बनाए रखने के लिए, Gemini, सोच-समझकर जवाब देने की प्रोसेस के सिग्नेचर दिखाता है. ये मॉडल की इंटरनल सोच-समझकर जवाब देने की प्रोसेस के एन्क्रिप्टेड वर्शन होते हैं.

Gemini 2.5 मॉडल , सोच-समझकर जवाब देने की प्रोसेस के सिग्नेचर तब दिखाते हैं, जब सोच-समझकर जवाब देने की प्रोसेस चालू हो और अनुरोध में फ़ंक्शन कॉल करने की सुविधा शामिल हो. खास तौर पर, फ़ंक्शन के एलान शामिल हों.
Gemini 3 मॉडल सभी तरह के हिस्सों के लिए, सोच-समझकर जवाब देने की प्रोसेस के सिग्नेचर दिखा सकते हैं. हमारा सुझाव है कि आपको मिले सभी सिग्नेचर को वापस भेजें. हालांकि, फ़ंक्शन कॉल करने के सिग्नेचर के लिए यह ज़रूरी है. ज़्यादा जानने के लिए, सोच-समझकर जवाब देने की प्रोसेस के सिग्नेचर वाला पेज पढ़ें.

फ़ंक्शन कॉल करने की सुविधा के साथ, इस्तेमाल की अन्य सीमाओं के बारे में यहां बताया गया है:

सिग्नेचर, जवाब के अन्य हिस्सों में मॉडल से मिलते हैं. जैसे, फ़ंक्शन कॉल करने या टेक्स्ट वाले हिस्से. पूरा जवाब अगले चरणों में, सभी हिस्सों के साथ मॉडल को वापस भेजें.
सिग्नेचर वाले हिस्सों को एक साथ न जोड़ें.
सिग्नेचर वाले किसी हिस्से को, बिना सिग्नेचर वाले किसी अन्य हिस्से के साथ न मिलाएं.

कीमत

सोच-समझकर जवाब देने की प्रोसेस चालू होने पर, जवाब की कीमत, आउटपुट टोकन और सोच-समझकर जवाब देने वाले टोकन की संख्या के योग के बराबर होती है. thoughtsTokenCount फ़ील्ड से, जनरेट किए गए सोच-समझकर जवाब देने वाले टोकन की कुल संख्या पाई जा सकती है.

Python

# ...
print("Thoughts tokens:",response.usage_metadata.thoughts_token_count)
print("Output tokens:",response.usage_metadata.candidates_token_count)

JavaScript

// ...
console.log(`Thoughts tokens: ${response.usageMetadata.thoughtsTokenCount}`);
console.log(`Output tokens: ${response.usageMetadata.candidatesTokenCount}`);

ऐप पर जाएं

// ...
usageMetadata, err := json.MarshalIndent(response.UsageMetadata, "", "  ")
if err != nil {
  log.Fatal(err)
}
fmt.Println("Thoughts tokens:", string(usageMetadata.thoughts_token_count))
fmt.Println("Output tokens:", string(usageMetadata.candidates_token_count))

सोच-समझकर जवाब देने वाले मॉडल, फ़ाइनल जवाब की क्वालिटी बेहतर बनाने के लिए, पूरी तरह से सोच-समझकर जवाब देते हैं. इसके बाद, सोच-समझकर जवाब देने की प्रोसेस के बारे में अहम जानकारी देने के लिए, खास जानकारी आउटपुट करते हैं. इसलिए, कीमत, सोच-समझकर जवाब देने वाले उन टोकन की संख्या के आधार पर तय की जाती है जिन्हें मॉडल को खास जानकारी जनरेट करने के लिए इस्तेमाल करना पड़ता है. भले ही, एपीआई से सिर्फ़ खास जानकारी आउटपुट की गई हो.

टोकन के बारे में ज़्यादा जानने के लिए, टोकन की संख्या गिनने की गाइड पढ़ें.

सबसे सही तरीके

इस सेक्शन में, सोच-समझकर जवाब देने वाले मॉडल का असरदार तरीके से इस्तेमाल करने के बारे में कुछ दिशा-निर्देश दिए गए हैं. हमेशा की तरह, हमारे प्रॉम्प्ट लिखने के दिशा-निर्देशों और सबसे सही तरीकों को फ़ॉलो करने से, आपको सबसे अच्छे नतीजे मिलेंगे.

डीबग करना और स्टीयरिंग

रीज़निंग की समीक्षा करना: जब आपको सोच-समझकर जवाब देने वाले मॉडल से, उम्मीद के मुताबिक जवाब नहीं मिल रहा है, तो Gemini की सोच-समझकर जवाब देने की प्रोसेस की खास जानकारी का ध्यान से विश्लेषण करना मददगार साबित हो सकता है. इससे यह देखा जा सकता है कि मॉडल ने टास्क को कैसे बांटा और नतीजे पर कैसे पहुंचा. साथ ही, इस जानकारी का इस्तेमाल करके, सही नतीजे पाए जा सकते हैं.
रीज़निंग में दिशा-निर्देश देना: अगर आपको खास तौर पर लंबा आउटपुट चाहिए, तो अपने प्रॉम्प्ट में दिशा-निर्देश दिए जा सकते हैं. इससे, मॉडल के सोच-समझकर जवाब देने की प्रोसेस की मात्रा को सीमित किया जा सकता है. सोच-समझकर जवाब देने की प्रोसेस इससे, जवाब के लिए ज़्यादा टोकन आउटपुट रिज़र्व किया जा सकता है.

टास्क की जटिलता

आसान टास्क (सोच-समझकर जवाब देने की प्रोसेस बंद की जा सकती है): सीधे-सीधे अनुरोधों के लिए, जिनमें जटिल रीज़निंग की ज़रूरत नहीं होती, सोच-समझकर जवाब देने की प्रोसेस की ज़रूरत नहीं होती. जैसे, किसी तथ्य को वापस पाना या कैटगरी तय करना. उदाहरण के लिए:
- "DeepMind की स्थापना कहां हुई थी?"
- "क्या इस ईमेल में मीटिंग के लिए कहा गया है या सिर्फ़ जानकारी दी गई है?"
मीडियम टास्क (डिफ़ॉल्ट/कुछ सोच-समझकर जवाब देना): कई सामान्य अनुरोधों को चरण-दर-चरण प्रोसेस करने या ज़्यादा गहराई से समझने से फ़ायदा मिलता है. Gemini, सोच-समझकर जवाब देने की प्रोसेस की क्षमता का इस्तेमाल, इन टास्क के लिए कर सकता है:
- प्रकाश संश्लेषण और बड़े होने की तुलना करना.
- इलेक्ट्रिक कारों और हाइब्रिड कारों की तुलना करना.
मुश्किल टास्क (सोच-समझकर जवाब देने की प्रोसेस की ज़्यादा से ज़्यादा क्षमता): मुश्किल चुनौतियों के लिए, जैसे कि गणित की मुश्किल समस्याओं को हल करना या कोडिंग टास्क, हमारा सुझाव है कि सोच-समझकर जवाब देने की प्रोसेस का ज़्यादा बजट सेट करें. इन टास्क के लिए, मॉडल को अपनी पूरी रीज़निंग और प्लानिंग की क्षमताओं का इस्तेमाल करना पड़ता है. अक्सर, जवाब देने से पहले, इसमें कई इंटरनल चरण शामिल होते हैं. उदाहरण के लिए:
- AIME 2025 में समस्या 1 को हल करें: सभी पूर्णांक आधार b > 9 का योग निकालें, जिसके लिए 17_b, 97_b का भाजक है.
- किसी वेब ऐप्लिकेशन के लिए Python कोड लिखें, जो रीयल-टाइम में शेयर बाज़ार का डेटा दिखाता है. इसमें उपयोगकर्ता की पुष्टि करने की सुविधा भी शामिल हो. इसे ज़्यादा से ज़्यादा असरदार बनाएं.

काम करने वाले मॉडल, टूल, और क्षमताएं

सोच-समझकर जवाब देने की प्रोसेस की सुविधाएं, 3 और 2.5 सीरीज़ के सभी मॉडल पर काम करती हैं. मॉडल की सभी क्षमताओं के बारे में, मॉडल की खास जानकारी वाले पेज पर जाना जा सकता है.

सोच-समझकर जवाब देने वाले मॉडल, Gemini के सभी टूल और क्षमताओं के साथ काम करते हैं. इससे मॉडल, बाहरी सिस्टम के साथ इंटरैक्ट कर सकते हैं, कोड को एक्ज़ीक्यूट कर सकते हैं या रीयल-टाइम में जानकारी ऐक्सेस कर सकते हैं. साथ ही, नतीजों को अपनी रीज़निंग और फ़ाइनल जवाब में शामिल कर सकते हैं.

सोच-समझकर जवाब देने वाले मॉडल के साथ टूल का इस्तेमाल करने के उदाहरण, सोच-समझकर जवाब देने की प्रोसेस की कुकबुक में देखे जा सकते हैं.

आगे क्या करना है?

सोच-समझकर जवाब देने की प्रोसेस की कवरेज, हमारी OpenAI के साथ कंपैटिबिलिटी गाइड में उपलब्ध है.