> ## Documentation Index
> Fetch the complete documentation index at: https://gcore.com/docs/llms.txt
> Use this file to discover all available pages before exploring further.

# List inference flavors



## OpenAPI

````yaml /api-reference/services_docs_mintlify/cloud_api.yaml get /cloud/v3/inference/flavors
# OpenAPI document header. Only one operation is defined under `paths` in this
# document; the title/description refer to the larger aggregated specification.
openapi: 3.1.0
info:
  title: Gcore OpenAPI – Cloud API
  description: >-
    This OpenAPI is an aggregated OpenAPI specification that unifies all Gcore
    products into a single file. It covers Cloud, CDN, DNS, WAAP, DDoS
    Protection, Object Storage, Streaming, and FastEdge services.
  # Opaque hex-like revision identifier. Quoted on purpose: OpenAPI requires
  # `info.version` to be a string, and an unquoted hash that happens to be
  # all digits (or shaped like `1234e5678`) would be loaded as a number.
  version: '2978be3a5492'
servers:
  - url: https://api.gcore.com
# Default security requirement applied to every operation that does not
# override it; `APIKey` is declared under components.securitySchemes.
security:
  - APIKey: []
# Tag catalogue used to group operations. The single operation defined in
# this document is tagged `Everywhere Inference`; the remaining names are not
# referenced by any operation visible here.
tags:
  - name: Bare Metal
  - name: Container as a Service
  - name: Cost Reports
  - name: DDoS Protection
  - name: Everywhere Inference
  - name: Everywhere Inference Apps
  - name: File Shares
  - name: Floating IPs
  - name: Function as a Service
  - name: GPU Bare Metal
  - name: GPU Virtual
  - name: IP Ranges
  - name: Images
  - name: Instances
  - name: Load Balancers
  - name: Logging
  - name: Managed Kubernetes
  - name: Managed PostgreSQL
  - name: Networks
  - name: Placement Groups
  - name: Ports
  - name: Projects
  - name: Quotas
  - name: Regions
  - name: Registry
  - name: Reservations
  - name: Reserved IPs
  - name: Routers
  - name: SSH Keys
  - name: Secrets
  - name: Security Groups
  - name: Snapshot Schedules
  - name: Snapshots
  - name: Tasks
  - name: User Actions
  - name: User Role Assignments
  - name: Volumes
paths:
  # Read-only listing of inference flavors, paged with `limit` / `offset`.
  /cloud/v3/inference/flavors:
    get:
      operationId: InferenceFlavorsHandlerV3.get
      summary: List inference flavors
      tags:
        - Everywhere Inference
      parameters:
        # Page size: integer greater than 0 and at most 1000 (default 1000).
        - name: limit
          in: query
          required: false
          description: Optional. Limit the number of returned items
          schema:
            type: integer
            title: Limit
            description: Optional. Limit the number of returned items
            default: 1000
            exclusiveMinimum: 0
            maximum: 1000
            example: 1000
            examples:
              - 1000
        # Number of leading records to skip: non-negative integer (default 0).
        - name: offset
          in: query
          required: false
          description: >-
            Optional. Offset value is used to exclude the first set of
            records from the result
          schema:
            type: integer
            title: Offset
            description: >-
              Optional. Offset value is used to exclude the first set of
              records from the result
            default: 0
            minimum: 0
            example: 0
            examples:
              - 0
      responses:
        # Only the success response is declared for this operation.
        '200':
          description: OK
          content:
            application/json:
              schema:
                $ref: '#/components/schemas/InferenceFlavorOutSerializerV3List'
components:
  schemas:
    # Response envelope of the flavor listing: a total `count` plus the
    # `results` array of flavor objects. Both fields are required.
    InferenceFlavorOutSerializerV3List:
      type: object
      title: InferenceFlavorOutSerializerV3List
      required:
        - count
        - results
      properties:
        count:
          type: integer
          title: Count
          description: Number of objects
          minimum: 0
          example: 1
          examples:
            - 1
        results:
          type: array
          title: Results
          description: Objects
          items:
            $ref: '#/components/schemas/InferenceFlavorOutSerializerV3'
    # A single inference flavor. Every property is required.
    #
    # The example values describe one coherent flavor (1x H100 80GB, 16 vCPU,
    # 232 GiB RAM, matching the example `name`) so that a sample response
    # assembled from the per-field examples is self-consistent.
    # NOTE(review): examples are illustrative; confirm against a real flavor
    # returned by the API if exact figures matter.
    InferenceFlavorOutSerializerV3:
      properties:
        cpu:
          description: Inference flavor cpu count.
          example: 16
          examples:
            - 16
          title: Cpu
          type: number
        description:
          description: Inference flavor description.
          example: 1xH100 / 16 vCPU / 232GiB RAM
          examples:
            - 1xH100 / 16 vCPU / 232GiB RAM
          title: Description
          type: string
        gpu:
          description: Inference flavor gpu count.
          example: 1
          examples:
            - 1
          title: Gpu
          type: integer
        gpu_compute_capability:
          description: Inference flavor gpu compute capability.
          # Kept quoted: the field is a string, and a bare 9.0 would load as
          # a float.
          example: '9.0'
          examples:
            - '9.0'
          title: Gpu Compute Capability
          type: string
        gpu_memory:
          description: Inference flavor gpu memory in Gi.
          example: 80
          examples:
            - 80
          title: Gpu Memory
          type: number
        gpu_model:
          description: Inference flavor gpu model.
          example: H100
          examples:
            - H100
          title: Gpu Model
          type: string
        is_gpu_shared:
          # Deprecated but still listed under `required` below.
          deprecated: true
          description: Inference flavor is gpu shared (always false, deprecated).
          example: false
          examples:
            - false
          title: Is Gpu Shared
          type: boolean
        memory:
          description: Inference flavor memory in Gi.
          example: 232
          examples:
            - 232
          title: Memory
          type: number
        name:
          description: Inference flavor name.
          example: inference-16vcpu-232gib-1xh100-80gb
          examples:
            - inference-16vcpu-232gib-1xh100-80gb
          title: Name
          type: string
      required:
        - name
        - cpu
        - memory
        - gpu
        - gpu_model
        - gpu_memory
        - is_gpu_shared
        - gpu_compute_capability
        - description
      title: InferenceFlavorOutSerializerV3
      type: object
  securitySchemes:
    # API key carried in the `Authorization` request header; this is the
    # scheme named by the document-level `security` requirement.
    APIKey:
      type: apiKey
      in: header
      name: Authorization
      description: >-
        API key for authentication. Make sure to include the word
        `apikey`, followed by a single space and then your token.

        Example: `apikey 1234$abcdef`

````