> ## Documentation Index
> Fetch the complete documentation index at: https://gcore.com/docs/llms.txt
> Use this file to discover all available pages before exploring further.

# Update inference application deployment

> Updates an existing application deployment.
You can modify the target regions and update configurations for individual components.
To disable a component, set its value to null. Only the provided fields will be updated;
all others remain unchanged.



## OpenAPI

````yaml /api-reference/services_documented/cloud_api.yaml patch /cloud/v3/inference/applications/{project_id}/deployments/{deployment_name}
openapi: 3.1.0
info:
  title: Gcore OpenAPI – Cloud API
  description: >-
    This OpenAPI is an aggregated OpenAPI specification that unifies all Gcore
    products into a single file. It covers Cloud, CDN, DNS, WAAP, DDoS
    Protection, Object Storage, Streaming, and FastEdge services.
  version: '2026-05-15T06:37:28.230198+00:00'
servers:
  - url: https://api.gcore.com
security:
  - APIKey: []
tags:
  - name: Bare Metal
    x-displayName: Bare Metal
  - name: Container as a Service
    x-displayName: Container as a Service
  - name: Cost Reports
    x-displayName: Cost Reports
  - name: DDoS Protection
    x-displayName: DDoS Protection
  - name: Everywhere Inference
    x-displayName: Everywhere Inference
  - name: Everywhere Inference Apps
    x-displayName: Everywhere Inference Apps
  - name: File Shares
    x-displayName: File Shares
  - name: Floating IPs
    x-displayName: Floating IPs
  - name: Function as a Service
    x-displayName: Function as a Service
  - name: GPU Bare Metal
    x-displayName: GPU Bare Metal
  - name: GPU Virtual
    x-displayName: GPU Virtual
  - name: IP Ranges
    x-displayName: IP Ranges
  - name: Images
    x-displayName: Images
  - name: Instances
    x-displayName: Instances
  - name: Load Balancers
    x-displayName: Load Balancers
  - name: Logging
    x-displayName: Logging
  - name: Managed Kubernetes
    x-displayName: Managed Kubernetes
  - name: Managed PostgreSQL
    x-displayName: Managed PostgreSQL
  - name: Networks
    x-displayName: Networks
  - name: Placement Groups
    x-displayName: Placement Groups
  - name: Projects
    x-displayName: Projects
  - name: Quotas
    x-displayName: Quotas
  - name: Regions
    x-displayName: Regions
  - name: Registry
    x-displayName: Registry
  - name: Reservations
    x-displayName: Reservations
  - name: Reserved IPs
    x-displayName: Reserved IPs
  - name: Routers
    x-displayName: Routers
  - name: SSH Keys
    x-displayName: SSH Keys
  - name: Secrets
    x-displayName: Secrets
  - name: Security Groups
    x-displayName: Security Groups
  - name: Snapshot Schedules
    x-displayName: Snapshot Schedules
  - name: Snapshots
    x-displayName: Snapshots
  - name: Tasks
    x-displayName: Tasks
  - name: User Actions
    x-displayName: User Actions
  - name: User Role Assignments
    x-displayName: User Role Assignments
  - name: Volumes
    x-displayName: Volumes
paths:
  /cloud/v3/inference/applications/{project_id}/deployments/{deployment_name}:
    patch:
      tags:
        - Everywhere Inference Apps
      summary: Update inference application deployment
      description: >-
        Updates an existing application deployment.

        You can modify the target regions and update configurations for
        individual components.

        To disable a component, set its value to null. Only the provided fields
        will be updated; all others remain unchanged.
      operationId: InferenceApplicationDeployment.patch
      parameters:
        - in: path
          name: project_id
          required: true
          description: Project ID
          schema:
            description: Project ID
            example: 1
            examples:
              - 1
            title: Project Id
            type: integer
        - in: path
          name: deployment_name
          required: true
          description: Name of deployment
          schema:
            description: Name of deployment
            title: Deployment Name
            type: string
      requestBody:
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/AppDeploymentPatchRequest'
      responses:
        '200':
          description: OK
          content:
            application/json:
              schema:
                $ref: '#/components/schemas/TaskIDsSerializer'
      x-codeSamples:
        - lang: Python
          source: >-
            import os

            from gcore import Gcore


            client = Gcore(
                api_key=os.environ.get("GCORE_API_KEY"),  # This is the default and can be omitted
            )

            task_id_list =
            client.cloud.inference.applications.deployments.update(
                deployment_name="deployment_name",
                project_id=1,
            )

            print(task_id_list.tasks)
        - lang: Go
          source: "package main\n\nimport (\n\t\"context\"\n\t\"fmt\"\n\n\t\"github.com/G-Core/gcore-go\"\n\t\"github.com/G-Core/gcore-go/cloud\"\n\t\"github.com/G-Core/gcore-go/option\"\n)\n\nfunc main() {\n\tclient := gcore.NewClient(\n\t\toption.WithAPIKey(\"My API Key\"),\n\t)\n\ttaskIDList, err := client.Cloud.Inference.Applications.Deployments.Update(\n\t\tcontext.TODO(),\n\t\t\"deployment_name\",\n\t\tcloud.InferenceApplicationDeploymentUpdateParams{\n\t\t\tProjectID: gcore.Int(1),\n\t\t},\n\t)\n\tif err != nil {\n\t\tpanic(err.Error())\n\t}\n\tfmt.Printf(\"%+v\\n\", taskIDList.Tasks)\n}\n"
components:
  schemas:
    AppDeploymentPatchRequest:
      properties:
        api_keys:
          description: List of API keys for the application
          example:
            - key1
            - key2
          examples:
            - - key1
              - key2
          items:
            type: string
          title: Api Keys
          type: array
        components_configuration:
          additionalProperties:
            anyOf:
              - $ref: '#/components/schemas/ComponentConfigurationPatch'
              - type: 'null'
          description: >-
            Mapping of component names to their configuration (e.g., `"model":
            {...}`)
          example:
            model:
              scale:
                max: 2
          examples:
            - model:
                scale:
                  max: 2
            - model:
                flavor: inference-16vcpu-232gib-1xh100-80gb
          title: Components Configuration
          type: object
        regions:
          description: Geographical regions to be updated for the deployment
          example:
            - 1
            - 2
          examples:
            - - 1
              - 2
          items:
            type: integer
          title: Regions
          type: array
      title: AppDeploymentPatchRequest
      type: object
    TaskIDsSerializer:
      properties:
        tasks:
          description: >-
            List of task IDs representing asynchronous operations. Use these IDs
            to monitor operation progress:

            - `GET /cloud/v1/tasks/{task_id}` - Check individual task status and
            details

            Poll task status until completion (`FINISHED`/`ERROR`) before
            proceeding with dependent operations.
          example:
            - d478ae29-dedc-4869-82f0-96104425f565
          examples:
            - - d478ae29-dedc-4869-82f0-96104425f565
          items:
            type: string
          title: Tasks
          type: array
      required:
        - tasks
      title: TaskIDsSerializer
      type: object
    ComponentConfigurationPatch:
      properties:
        exposed:
          description: >-
            Whether the component should be exposed via a public endpoint (e.g.,
            for external inference/API access).
          title: Exposed
          type: boolean
        flavor:
          description: >-
            Specifies the compute configuration (e.g., CPU/GPU size) to be used
            for the component.
          title: Flavor
          type: string
        parameter_overrides:
          additionalProperties:
            anyOf:
              - $ref: '#/components/schemas/ParameterOverride'
              - type: 'null'
          description: Map of parameter overrides for customization
          title: Parameter Overrides
          type: object
        scale:
          $ref: '#/components/schemas/ScalePatch'
          description: Scaling parameters of the component
      title: ComponentConfigurationPatch
      type: object
    ParameterOverride:
      properties:
        value:
          description: New value assigned to the overridden parameter
          title: Value
          type: string
      required:
        - value
      title: ParameterOverride
      type: object
    ScalePatch:
      properties:
        max:
          description: Maximum number of replicas the component can be scaled up to
          title: Max
          type: integer
        min:
          description: Minimum number of replicas the component can be scaled down to
          title: Min
          type: integer
      title: ScalePatch
      type: object
  securitySchemes:
    APIKey:
      description: >-
        API key for authentication. Make sure to include the word `apikey`,
        followed by a single space and then your token.

        Example: `apikey 1234$abcdef`
      type: apiKey
      in: header
      name: Authorization

````