Starting April 29, 2025, Gemini 1.5 Pro and Gemini 1.5 Flash models are not available in projects that have no prior usage of these models, including new projects. For details, see Model versions and lifecycle.
Create a context cache
Stay organized with collections
Save and categorize content based on your preferences.
Create a context cache to reduce costs for repeated requests that contain the same high-token-count input.
Explore further
For detailed documentation that includes this code sample, see the following:
Code sample
Except as otherwise noted, the content of this page is licensed under the Creative Commons Attribution 4.0 License, and code samples are licensed under the Apache 2.0 License. For details, see the Google Developers Site Policies. Java is a registered trademark of Oracle and/or its affiliates.
[[["Easy to understand","easyToUnderstand","thumb-up"],["Solved my problem","solvedMyProblem","thumb-up"],["Other","otherUp","thumb-up"]],[["Hard to understand","hardToUnderstand","thumb-down"],["Incorrect information or sample code","incorrectInformationOrSampleCode","thumb-down"],["Missing the information/samples I need","missingTheInformationSamplesINeed","thumb-down"],["Other","otherDown","thumb-down"]],[],[],[],null,["# Create a context cache to reduce costs with repeated requests that contain the same token count input.\n\nExplore further\n---------------\n\n\nFor detailed documentation that includes this code sample, see the following:\n\n- [Create a context cache](/vertex-ai/generative-ai/docs/context-cache/context-cache-create)\n\nCode sample\n-----------\n\n### Go\n\n\nBefore trying this sample, follow the Go setup instructions in the\n[Vertex AI quickstart using\nclient libraries](/vertex-ai/docs/start/client-libraries).\n\n\nFor more information, see the\n[Vertex AI Go API\nreference documentation](/go/docs/reference/cloud.google.com/go/aiplatform/latest/apiv1).\n\n\nTo authenticate to Vertex AI, set up Application Default Credentials.\nFor more information, see\n\n[Set up authentication for a local development environment](/docs/authentication/set-up-adc-local-dev-environment).\n\n import (\n \t\"context\"\n \t\"encoding/json\"\n \t\"fmt\"\n \t\"io\"\n \t\"time\"\n\n \tgenai \"google.golang.org/genai\"\n )\n\n // createContentCache shows how to create a content cache with an expiration parameter.\n func createContentCache(w io.Writer) (string, error) {\n \tctx := context.Background()\n\n \tclient, err := genai.NewClient(ctx, &genai.ClientConfig{\n \t\tHTTPOptions: genai.HTTPOptions{APIVersion: \"v1\"},\n \t})\n \tif err != nil {\n \t\treturn \"\", fmt.Errorf(\"failed to create genai client: %w\", err)\n \t}\n\n \tmodelName := \"gemini-2.5-flash\"\n\n \tsystemInstruction := \"You are an expert researcher. 
You always stick to the facts \" +\n \t\t\"in the sources provided, and never make up new facts. \" +\n \t\t\"Now look at these research papers, and answer the following questions.\"\n\n \tcacheContents := []*genai.Content{\n \t\t{\n \t\t\tParts: []*genai.Part{\n \t\t\t\t{FileData: &genai.FileData{\n \t\t\t\t\tFileURI: \"gs://cloud-samples-data/generative-ai/pdf/2312.11805v3.pdf\",\n \t\t\t\t\tMIMEType: \"application/pdf\",\n \t\t\t\t}},\n \t\t\t\t{FileData: &genai.FileData{\n \t\t\t\t\tFileURI: \"gs://cloud-samples-data/generative-ai/pdf/2403.05530.pdf\",\n \t\t\t\t\tMIMEType: \"application/pdf\",\n \t\t\t\t}},\n \t\t\t},\n \t\t\tRole: \"user\",\n \t\t},\n \t}\n \tconfig := &genai.CreateCachedContentConfig{\n \t\tContents: cacheContents,\n \t\tSystemInstruction: &genai.Content{\n \t\t\tParts: []*genai.Part{\n \t\t\t\t{Text: systemInstruction},\n \t\t\t},\n \t\t},\n \t\tDisplayName: \"example-cache\",\n \t\tTTL: 86400 * time.Second,\n \t}\n\n \tres, err := client.Caches.Create(ctx, modelName, config)\n \tif err != nil {\n \t\treturn \"\", fmt.Errorf(\"failed to create content cache: %w\", err)\n \t}\n\n \tcachedContent, err := json.MarshalIndent(res, \"\", \" \")\n \tif err != nil {\n \t\treturn \"\", fmt.Errorf(\"failed to marshal cache info: %w\", err)\n \t}\n\n \t// See the documentation: https://pkg.go.dev/google.golang.org/genai#CachedContent\n \tfmt.Fprintln(w, string(cachedContent))\n\n \t// Example response:\n \t// {\n \t// \"name\": \"projects/111111111111/locations/us-central1/cachedContents/1111111111111111111\",\n \t// \"displayName\": \"example-cache\",\n \t// \"model\": \"projects/111111111111/locations/us-central1/publishers/google/models/gemini-2.5-flash\",\n \t// \"createTime\": \"2025-02-18T15:05:08.29468Z\",\n \t// \"updateTime\": \"2025-02-18T15:05:08.29468Z\",\n \t// \"expireTime\": \"2025-02-19T15:05:08.280828Z\",\n \t// \"usageMetadata\": {\n \t// \"imageCount\": 167,\n \t// \"textCount\": 153,\n \t// 
\"totalTokenCount\": 43125\n \t// }\n \t// }\n\n \treturn res.Name, nil\n }\n\n### Python\n\n\nBefore trying this sample, follow the Python setup instructions in the\n[Vertex AI quickstart using\nclient libraries](/vertex-ai/docs/start/client-libraries).\n\n\nFor more information, see the\n[Vertex AI Python API\nreference documentation](/python/docs/reference/aiplatform/latest).\n\n\nTo authenticate to Vertex AI, set up Application Default Credentials.\nFor more information, see\n\n[Set up authentication for a local development environment](/docs/authentication/set-up-adc-local-dev-environment).\n\n from google import genai\n from google.genai.types import Content, CreateCachedContentConfig, HttpOptions, Part\n\n client = genai.Client(http_options=HttpOptions(api_version=\"v1\"))\n\n system_instruction = \"\"\"\n You are an expert researcher. You always stick to the facts in the sources provided, and never make up new facts.\n Now look at these research papers, and answer the following questions.\n \"\"\"\n\n contents = [\n Content(\n role=\"user\",\n parts=[\n Part.from_uri(\n file_uri=\"gs://cloud-samples-data/generative-ai/pdf/2312.11805v3.pdf\",\n mime_type=\"application/pdf\",\n ),\n Part.from_uri(\n file_uri=\"gs://cloud-samples-data/generative-ai/pdf/2403.05530.pdf\",\n mime_type=\"application/pdf\",\n ),\n ],\n )\n ]\n\n content_cache = client.caches.create(\n model=\"gemini-2.5-flash\",\n config=CreateCachedContentConfig(\n contents=contents,\n system_instruction=system_instruction,\n # (Optional) For enhanced security, the content cache can be encrypted using a Cloud KMS key\n # kms_key_name = \"projects/.../locations/us-central1/keyRings/.../cryptoKeys/...\"\n display_name=\"example-cache\",\n ttl=\"86400s\",\n ),\n )\n\n print(content_cache.name)\n print(content_cache.usage_metadata)\n # Example response:\n # projects/111111111111/locations/us-central1/cachedContents/1111111111111111111\n # CachedContentUsageMetadata(audio_duration_seconds=None, 
image_count=167,\n # text_count=153, total_token_count=43130, video_duration_seconds=None)\n\nWhat's next\n-----------\n\n\nTo search and filter code samples for other Google Cloud products, see the\n[Google Cloud sample browser](/docs/samples?product=googlegenaisdk)."]]