TrueChartsClone/charts/stable/fabulinus/values.yaml

# Default container image (CPU build). The main container refers to this entry
# by name through `imageSelector: image`.
image:
  repository: tytn/fabulinus
  pullPolicy: IfNotPresent
  # Floating `latest-cpu` name pinned to a specific sha256 digest.
  tag: latest-cpu@sha256:f8b30eaa5b61d6085fc715f40619733846927c2266a3e20523e93fb58afeef38
# Alternative image from the same repository, using the `latest-gpu` tag.
# NOTE(review): nothing in this file references `gpuImage`; the main container's
# imageSelector is set to `image`, so switching fabulinus.device to gpu
# presumably also requires overriding imageSelector - confirm.
gpuImage:
  repository: tytn/fabulinus
  pullPolicy: IfNotPresent
  # Floating `latest-gpu` name pinned to a specific sha256 digest.
  tag: latest-gpu@sha256:9a826a578ca4157fbe3c091eb78aa35dfca6675f9fae24dcb90495ba4d9715d1

# Container-level security settings: the container runs as UID 0 / GID 0 (root)
# and its root filesystem is left writable.
# NOTE(review): presumably required by the upstream image - confirm before
# tightening either setting.
securityContext:
  container:
    readOnlyRootFilesystem: false
    runAsUser: 0
    runAsGroup: 0

# Main service definition: a single HTTP port named `main`.
service:
  main:
    ports:
      main:
        protocol: http
        # Port the container is targeted on.
        targetPort: 80
        # Port published by the service.
        port: 10687

# Application settings. Each key below is read by the main container's `env`
# section and passed on as a TAKEOFF_* environment variable.
fabulinus:
  # Allowed values: cpu | gpu  (-> TAKEOFF_DEVICE)
  device: cpu
  # Model name  (-> TAKEOFF_MODEL_NAME)
  model: 'google/flan-t5-small'
  # Allowed values: int8 | float16 | bfloat16 | int8_float16 | int8_bfloat16
  # (-> TAKEOFF_QUANT_TYPE)
  quant_type: int8
  # (-> TAKEOFF_MAX_BATCH_SIZE)
  max_batch_size: 32
  # (-> TAKEOFF_DISABLE_BATCHING)
  disable_batching: true

# Main workload: one container named `main`.
workload:
  main:
    podSpec:
      containers:
        main:
          # Name of the top-level values key that holds the image to run.
          imageSelector: image
          # Environment passed to the container; every value is a template
          # expression that resolves to a key under `.Values.fabulinus`.
          env:
            TAKEOFF_DEVICE: '{{ .Values.fabulinus.device }}'
            TAKEOFF_MODEL_NAME: '{{ .Values.fabulinus.model }}'
            TAKEOFF_QUANT_TYPE: '{{ .Values.fabulinus.quant_type }}'
            TAKEOFF_MAX_BATCH_SIZE: '{{ .Values.fabulinus.max_batch_size }}'
            TAKEOFF_DISABLE_BATCHING: '{{ .Values.fabulinus.disable_batching }}'
          # Liveness and readiness are HTTP probes against /docs; startup is a
          # plain TCP probe.
          # NOTE(review): no probe port is set here; presumably the chart
          # library falls back to the main service port - confirm.
          probes:
            liveness:
              enabled: true
              type: http
              path: /docs
            readiness:
              enabled: true
              type: http
              path: /docs
            startup:
              enabled: true
              type: tcp

# Persistent storage: a volume named `models` mounted inside the container.
persistence:
  models:
    enabled: true
    # Path inside the container where the volume is mounted.
    mountPath: '/code/models'

# Enables the portal entry named `open`.
# NOTE(review): presumably this provides the "open" link/button to the app's
# web UI in the hosting platform - confirm against the chart library.
portal:
  open:
    enabled: true
feat(fabulinus) add fabulinus (#16909) Description Fabulinus is the server component of the TitanML Takeoff server. ⚒️ Fixes # <!--(issue)--> ⚙️ Type of change - [X] ⚙️ Feature/App addition - [ ] 🪛 Bugfix - [ ] ⚠️ Breaking change (fix or feature that would cause existing functionality to not work as expected) - [ ] 🔃 Refactor of current code 🧪 How Has This Been Tested? <!-- Please describe the tests that you ran to verify your changes. Provide instructions so we can reproduce. Please also list any relevant details for your test configuration --> 📃 Notes: <!-- Please enter any other relevant information here --> ✔️ Checklist: - [X] ⚖️ My code follows the style guidelines of this project - [X] 👀 I have performed a self-review of my own code - [ ] #️⃣ I have commented my code, particularly in hard-to-understand areas - [ ] 📄 I have made corresponding changes to the documentation - [ ] ⚠️ My changes generate no new warnings - [ ] 🧪 I have added tests to this description that prove my fix is effective or that my feature works - [ ] ⬆️ I increased versions for any altered app according to semantic versioning ➕ App addition If this PR is an app addition please make sure you have done the following. - [ ] 🪞 I have opened a PR on [truecharts/containers](https://github.com/truecharts/containers) adding the container to TrueCharts mirror repo. - [X] 🖼️ I have added an icon in the Chart's root directory called `icon.png` --- _Please don't blindly check all the boxes. Read them and only check those that apply. Those checkboxes are there for the reviewer to see what is this all about and the status of this PR with a quick glance._ 2024-01-09 18:13:43 +00:00			`image:`
			`repository: tytn/fabulinus`
			`pullPolicy: IfNotPresent`
			`tag: latest-cpu@sha256:f8b30eaa5b61d6085fc715f40619733846927c2266a3e20523e93fb58afeef38`
			`gpuImage:`
			`repository: tytn/fabulinus`
			`pullPolicy: IfNotPresent`
			`tag: latest-gpu@sha256:9a826a578ca4157fbe3c091eb78aa35dfca6675f9fae24dcb90495ba4d9715d1`

			`securityContext:`
			`container:`
			`readOnlyRootFilesystem: false`
			`runAsUser: 0`
			`runAsGroup: 0`

			`service:`
			`main:`
			`ports:`
			`main:`
			`protocol: http`
			`targetPort: 80`
			`port: 10687`

			`fabulinus:`
			`# cpu \| gpu`
			`device: cpu`
			`model: "google/flan-t5-small"`
			`# int8 \| float16 \| bfloat16 \| int8_float16 \| int8_bfloat16`
			`quant_type: int8`
			`max_batch_size: 32`
			`disable_batching: true`

			`workload:`
			`main:`
			`podSpec:`
			`containers:`
			`main:`
			`imageSelector: image`
			`probes:`
			`liveness:`
			`enabled: true`
			`type: http`
			`path: /docs`
			`readiness:`
			`enabled: true`
			`type: http`
			`path: /docs`
			`startup:`
			`enabled: true`
			`type: tcp`
			`env:`
			`TAKEOFF_DEVICE: "{{ .Values.fabulinus.device }}"`
			`TAKEOFF_MODEL_NAME: "{{ .Values.fabulinus.model }}"`
			`TAKEOFF_QUANT_TYPE: "{{ .Values.fabulinus.quant_type }}"`
			`TAKEOFF_MAX_BATCH_SIZE: "{{ .Values.fabulinus.max_batch_size }}"`
			`TAKEOFF_DISABLE_BATCHING: "{{ .Values.fabulinus.disable_batching }}"`

			`persistence:`
			`models:`
			`enabled: true`
			`mountPath: "/code/models"`

			`portal:`
			`open:`
			`enabled: true`