NexusGPU
diff --git a/charts/tensor-fusion/.helmignore b/charts/tensor-fusion/.helmignore
Lines changed: 23 additions & 0 deletions
diff --git a/charts/tensor-fusion/Chart.yaml b/charts/tensor-fusion/Chart.yaml
Lines changed: 24 additions & 0 deletions
diff --git a/charts/tensor-fusion/crds/tensor-fusion.ai_gpunodeclasses.yaml b/charts/tensor-fusion/crds/tensor-fusion.ai_gpunodeclasses.yaml
Lines changed: 112 additions & 0 deletions
diff --git a/charts/tensor-fusion/crds/tensor-fusion.ai_gpunodes.yaml b/charts/tensor-fusion/crds/tensor-fusion.ai_gpunodes.yaml
Lines changed: 176 additions & 0 deletions
@@ -0,0 +1,23 @@
+# Patterns to ignore when building packages.
+# This supports shell glob matching, relative path matching, and
+# negation (prefixed with !). Only one pattern per line.
+.DS_Store
+# Common VCS dirs
+.git/
+.gitignore
+.bzr/
+.bzrignore
+.hg/
+.hgignore
+.svn/
+# Common backup files
+*.swp
+*.bak
+*.tmp
+*.orig
+*~
+# Various IDEs
+.project
+.idea/
+*.tmproj
+.vscode/
@@ -0,0 +1,24 @@
+apiVersion: v2
+name: tensor-fusion
+description: A Helm chart for deploying Tensor Fusion and its tensor-fusion.ai CRDs on Kubernetes
+
+# A chart can be either an 'application' or a 'library' chart.
+#
+# Application charts are a collection of templates that can be packaged into versioned archives
+# to be deployed.
+#
+# Library charts provide useful utilities or functions for the chart developer. They're included as
+# a dependency of application charts to inject those utilities and functions into the rendering
+# pipeline. Library charts do not define any templates and therefore cannot be deployed.
+type: application
+
+# This is the chart version. This version number should be incremented each time you make changes
+# to the chart and its templates, including the app version.
+# Versions are expected to follow Semantic Versioning (https://semver.org/)
+version: 0.1.0
+
+# This is the version number of the application being deployed. This version number should be
+# incremented each time you make changes to the application. Versions are not expected to
+# follow Semantic Versioning. They should reflect the version the application is using.
+# It is recommended to use it with quotes.
+appVersion: "1.16.0"  # NOTE(review): "1.16.0" is the `helm create` scaffold default; confirm it matches the shipped Tensor Fusion release
@@ -0,0 +1,112 @@
+---
+apiVersion: apiextensions.k8s.io/v1
+kind: CustomResourceDefinition  # registers the GPUNodeClass kind in the tensor-fusion.ai API group
+metadata:
+  annotations:
+    controller-gen.kubebuilder.io/version: v0.16.4  # NOTE(review): presumably generated from Go types by controller-gen; regenerate instead of hand-editing
+  name: gpunodeclasses.tensor-fusion.ai
+spec:
+  group: tensor-fusion.ai
+  names:
+    kind: GPUNodeClass
+    listKind: GPUNodeClassList
+    plural: gpunodeclasses
+    singular: gpunodeclass
+  scope: Cluster  # cluster-scoped: GPUNodeClass objects are not namespaced
+  versions:
+  - name: v1  # the only version listed here; it is both served and the storage version
+    schema:
+      openAPIV3Schema:
+        description: GPUNodeClass is the Schema for the gpunodeclasses API.
+        properties:
+          apiVersion:
+            description: |-
+              APIVersion defines the versioned schema of this representation of an object.
+              Servers should convert recognized schemas to the latest internal value, and
+              may reject unrecognized values.
+              More info: https://git.k8s.io/community/contributors/devel/sig-architecture/api-conventions.md#resources
+            type: string
+          kind:
+            description: |-
+              Kind is a string value representing the REST resource this object represents.
+              Servers may infer this from the endpoint the client submits requests to.
+              Cannot be updated.
+              In CamelCase.
+              More info: https://git.k8s.io/community/contributors/devel/sig-architecture/api-conventions.md#types-kinds
+            type: string
+          metadata:
+            type: object
+          spec:
+            description: GPUNodeClassSpec defines the desired state of GPUNodeClass.
+            properties:
+              blockDeviceMappings:  # list of entries pairing a device name with EBS volume settings
+                items:
+                  properties:
+                    deviceName:
+                      type: string
+                    ebs:
+                      properties:
+                        deleteOnTermination:
+                          type: boolean
+                        encrypted:
+                          type: boolean
+                        volumeSize:  # string, not integer; NOTE(review): presumably a quantity such as "100Gi" - confirm
+                          type: string
+                        volumeType:
+                          type: string
+                      type: object
+                  type: object
+                type: array
+              instanceProfile:
+                type: string
+              metadataOptions:  # NOTE(review): field names look like EC2 instance metadata (IMDS) options - confirm
+                properties:
+                  httpEndpoint:
+                    type: string
+                  httpProtocolIPv6:
+                    type: string
+                  httpPutResponseHopLimit:
+                    type: integer  # no format or minimum/maximum bounds are declared
+                  httpTokens:
+                    type: string
+                type: object
+              osImageFamily:
+                type: string
+              osImageSelectorTerms:  # list of terms, each with optional name and owner strings
+                items:
+                  properties:
+                    name:
+                      type: string
+                    owner:
+                      type: string
+                  type: object
+                type: array
+              securityGroupSelectorTerms:  # list of terms, each selecting by id only
+                items:
+                  properties:
+                    id:
+                      type: string
+                  type: object
+                type: array
+              subnetSelectorTerms:  # list of terms, each selecting by id only
+                items:
+                  properties:
+                    id:
+                      type: string
+                  type: object
+                type: array
+              tags:  # free-form map of string keys to string values
+                additionalProperties:
+                  type: string
+                type: object
+              userData:
+                type: string
+            type: object  # no "required" list is declared, so every spec field is optional
+          status:  # NOTE(review): no properties declared; with default CRD pruning, status fields written by a controller would be dropped - confirm intended
+            description: GPUNodeClassStatus defines the observed state of GPUNodeClass.
+            type: object
+        type: object
+    served: true
+    storage: true
+    subresources:
+      status: {}  # enables the /status subresource for this version
@@ -0,0 +1,176 @@
+---
+apiVersion: apiextensions.k8s.io/v1
+kind: CustomResourceDefinition  # registers the GPUNode kind in the tensor-fusion.ai API group
+metadata:
+  annotations:
+    controller-gen.kubebuilder.io/version: v0.16.4  # NOTE(review): presumably generated from Go types by controller-gen; regenerate instead of hand-editing
+  name: gpunodes.tensor-fusion.ai
+spec:
+  group: tensor-fusion.ai
+  names:
+    kind: GPUNode
+    listKind: GPUNodeList
+    plural: gpunodes
+    singular: gpunode
+  scope: Cluster  # cluster-scoped: GPUNode objects are not namespaced
+  versions:
+  - name: v1  # the only version listed here; it is both served and the storage version
+    schema:
+      openAPIV3Schema:
+        description: GPUNode is the Schema for the gpunodes API.
+        properties:
+          apiVersion:
+            description: |-
+              APIVersion defines the versioned schema of this representation of an object.
+              Servers should convert recognized schemas to the latest internal value, and
+              may reject unrecognized values.
+              More info: https://git.k8s.io/community/contributors/devel/sig-architecture/api-conventions.md#resources
+            type: string
+          kind:
+            description: |-
+              Kind is a string value representing the REST resource this object represents.
+              Servers may infer this from the endpoint the client submits requests to.
+              Cannot be updated.
+              In CamelCase.
+              More info: https://git.k8s.io/community/contributors/devel/sig-architecture/api-conventions.md#types-kinds
+            type: string
+          metadata:
+            type: object
+          spec:
+            description: GPUNodeSpec defines the desired state of GPUNode.
+            properties:
+              gpuCardIndices:  # optional subset of GPU cards; per the description, empty means all cards are onboarded
+                description: |-
+                  if not all GPU cards should be used, specify the GPU card indices, default to empty,
+                  onboard all GPU cards to the pool
+                items:
+                  type: integer  # no minimum is declared, so negative indices pass schema validation
+                type: array
+              manageMode:  # plain string: no enum restricts the accepted values
+                type: string
+            type: object  # no "required" list is declared, so every spec field is optional
+          status:
+            description: GPUNodeStatus defines the observed state of GPUNode.
+            properties:
+              availableTFlops:  # int32, so only whole-number values can be represented
+                format: int32
+                type: integer
+              availableVRAM:  # string; NOTE(review): presumably a resource quantity (e.g. "80Gi") - confirm
+                type: string
+              conditions:  # NOTE(review): item schema appears to match the standard metav1.Condition shape - confirm
+                items:
+                  description: Condition contains details for one aspect of the current
+                    state of this API Resource.
+                  properties:
+                    lastTransitionTime:
+                      description: |-
+                        lastTransitionTime is the last time the condition transitioned from one status to another.
+                        This should be when the underlying condition changed.  If that is not known, then using the time when the API field changed is acceptable.
+                      format: date-time
+                      type: string
+                    message:
+                      description: |-
+                        message is a human readable message indicating details about the transition.
+                        This may be an empty string.
+                      maxLength: 32768
+                      type: string
+                    observedGeneration:
+                      description: |-
+                        observedGeneration represents the .metadata.generation that the condition was set based upon.
+                        For instance, if .metadata.generation is currently 12, but the .status.conditions[x].observedGeneration is 9, the condition is out of date
+                        with respect to the current state of the instance.
+                      format: int64
+                      minimum: 0
+                      type: integer
+                    reason:
+                      description: |-
+                        reason contains a programmatic identifier indicating the reason for the condition's last transition.
+                        Producers of specific condition types may define expected values and meanings for this field,
+                        and whether the values are considered a guaranteed API.
+                        The value should be a CamelCase string.
+                        This field may not be empty.
+                      maxLength: 1024
+                      minLength: 1
+                      pattern: ^[A-Za-z]([A-Za-z0-9_,:]*[A-Za-z0-9_])?$
+                      type: string
+                    status:
+                      description: status of the condition, one of True, False, Unknown.
+                      enum:
+                      - "True"
+                      - "False"
+                      - Unknown
+                      type: string
+                    type:
+                      description: type of condition in CamelCase or in foo.example.com/CamelCase.
+                      maxLength: 316
+                      pattern: ^([a-z0-9]([-a-z0-9]*[a-z0-9])?(\.[a-z0-9]([-a-z0-9]*[a-z0-9])?)*/)?(([A-Za-z0-9][-A-Za-z0-9_.]*)?[A-Za-z0-9])$
+                      type: string
+                  required:
+                  - lastTransitionTime
+                  - message
+                  - reason
+                  - status
+                  - type
+                  type: object
+                type: array
+              hypervisorStatus:  # hypervisor state, version and last heartbeat timestamp
+                properties:
+                  hypervisorState:
+                    type: string
+                  hypervisorVersion:
+                    type: string
+                  lastHeartbeatTime:
+                    format: date-time
+                    type: string
+                type: object
+              loadedModels:
+                items:
+                  type: string
+                type: array
+              managedGPUResourceIDs:
+                items:
+                  type: string
+                type: array
+              managedGPUs:
+                format: int32
+                type: integer
+              nodeInfo:
+                properties:
+                  architecture:
+                    type: string
+                  gpuCount:
+                    format: int32
+                    type: integer
+                  gpuDriverVersion:
+                    type: string
+                  gpuModel:
+                    type: string
+                  hostname:
+                    type: string
+                  ip:
+                    type: string
+                  kernalVersion:  # NOTE(review): likely a misspelling of "kernelVersion"; this is the serialized field name, so fix it in the Go JSON tag before clients depend on it
+                    type: string
+                  operatingSystem:
+                    type: string
+                  osImage:
+                    type: string
+                type: object
+              phase:  # NOTE(review): description names TensorFusionCluster although this is GPUNode status; presumably a reused phase type - confirm and reword at the source
+                description: TensorFusionClusterPhase represents the phase of the
+                  TensorFusionCluster resource.
+                type: string
+              totalGPUs:
+                format: int32
+                type: integer
+              totalTFlops:  # int32, so only whole-number values can be represented
+                format: int32
+                type: integer
+              totalVRAM:  # string; NOTE(review): presumably a resource quantity (e.g. "80Gi") - confirm
+                type: string
+            type: object
+        type: object
+    served: true
+    storage: true
+    subresources:
+      status: {}  # enables the /status subresource for this version