Skip to content

Commit

Permalink
Feature/inferenceservice (#1034)
Browse files: browse the repository at this point in the history
* chore: update inferenceservice yaml

* chore: update copyright
  • Loading branch information
gujingit committed Feb 1, 2024
1 parent 875d002 commit 8739eb5
Show file tree
Hide file tree
Showing 2 changed files with 55 additions and 39 deletions.
22 changes: 20 additions & 2 deletions charts/kserve/templates/inferenceservice.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -49,8 +49,6 @@ spec:
{{- if .Values.modelFormat.version }}
version: {{ .Values.modelFormat.version | quote }}
{{- end }}
{{- end }}
{{- if .Values.storageUri }}
{{- if .Values.runtime }}
runtime: {{ .Values.runtime }}
{{- end }}
Expand Down Expand Up @@ -104,6 +102,16 @@ spec:
{{- if gt (int $gpuCore) 0 }}
aliyun.com/gpu-core.percentage: {{ .Values.gpuCore }}
{{- end }}
requests:
{{- if gt (int $gpuCount) 0}}
nvidia.com/gpu: {{ .Values.gpuCount }}
{{- end }}
{{- if gt (int $gpuMemory) 0}}
aliyun.com/gpu-mem: {{ .Values.gpuMemory }}
{{- end }}
{{- if gt (int $gpuCore) 0 }}
aliyun.com/gpu-core.percentage: {{ .Values.gpuCore }}
{{- end }}
volumeMounts:
{{- if .Values.shareMemory }}
- mountPath: /dev/shm
Expand Down Expand Up @@ -162,6 +170,16 @@ spec:
protocol: TCP
{{- end }}
resources:
requests:
{{- if gt (int $gpuCount) 0}}
nvidia.com/gpu: {{ .Values.gpuCount }}
{{- end }}
{{- if gt (int $gpuMemory) 0}}
aliyun.com/gpu-mem: {{ .Values.gpuMemory }}
{{- end }}
{{- if gt (int $gpuCore) 0 }}
aliyun.com/gpu-core.percentage: {{ .Values.gpuCore }}
{{- end }}
limits:
{{- if .Values.cpu }}
cpu: {{ .Values.cpu }}
Expand Down
72 changes: 35 additions & 37 deletions mkdocs.yml
Original file line number Diff line number Diff line change
Expand Up @@ -7,55 +7,53 @@ nav:
- Home: index.md
- Installation: installation/index.md
- User Guide:
- Training Job Guide: training/index.md
- Serving Job Guide: serving/index.md
- Display Resource Usage Guide: top/index.md
- Supports Multiple Users Guide: multiple-users.md
- Isolate Users In Namespace: isolate-users-in-namespace.md
- Training Job Guide: training/index.md
- Serving Job Guide: serving/index.md
- Display Resource Usage Guide: top/index.md
- Supports Multiple Users Guide: multiple-users.md
- Isolate Users In Namespace: isolate-users-in-namespace.md
- SDK:
- Golang: sdk/go/index.md
- Golang: sdk/go/index.md
- Release Notes:
- v0.9.11: releases/v0.9.11.md
- v0.9.10: releases/v0.9.10.md
- v0.9.9: releases/v0.9.9.md
- v0.9.8: releases/v0.9.8.md
- v0.9.7: releases/v0.9.7.md
- v0.9.6: releases/v0.9.6.md
- v0.9.5: releases/v0.9.5.md
- v0.9.4: releases/v0.9.4.md
- v0.9.3: releases/v0.9.3.md
- v0.9.2: releases/v0.9.2.md
- v0.9.1: releases/v0.9.1.md
- v0.9.0: releases/v0.9.0.md
- v0.8.9: releases/v0.8.9.md
- v0.8.8: releases/v0.8.8.md
- v0.8.7: releases/v0.8.7.md
- v0.8.6: releases/v0.8.6.md
- v0.8.5: releases/v0.8.5.md
- v0.8.0: releases/v0.8.0.md
- v0.7.0: releases/v0.7.0.md
- v0.4.0: releases/v0.4.0.md
- v0.3.0: releases/v0.3.0.md
- v0.2.0: releases/v0.2.0.md
- v0.1.0: releases/v0.1.0.md
- v0.9.11: releases/v0.9.11.md
- v0.9.10: releases/v0.9.10.md
- v0.9.9: releases/v0.9.9.md
- v0.9.8: releases/v0.9.8.md
- v0.9.7: releases/v0.9.7.md
- v0.9.6: releases/v0.9.6.md
- v0.9.5: releases/v0.9.5.md
- v0.9.4: releases/v0.9.4.md
- v0.9.3: releases/v0.9.3.md
- v0.9.2: releases/v0.9.2.md
- v0.9.1: releases/v0.9.1.md
- v0.9.0: releases/v0.9.0.md
- v0.8.9: releases/v0.8.9.md
- v0.8.8: releases/v0.8.8.md
- v0.8.7: releases/v0.8.7.md
- v0.8.6: releases/v0.8.6.md
- v0.8.5: releases/v0.8.5.md
- v0.8.0: releases/v0.8.0.md
- v0.7.0: releases/v0.7.0.md
- v0.4.0: releases/v0.4.0.md
- v0.3.0: releases/v0.3.0.md
- v0.2.0: releases/v0.2.0.md
- v0.1.0: releases/v0.1.0.md
- FAQ: faq/index.md
- About:
- Adopter: about/ADOPTERS.md
- About:
- Adopter: about/ADOPTERS.md

theme:
theme:
name: material
#name: mkdocs
#name: readthedocs
highlightjs: true
hljs_languages:
- yaml
- django

markdown_extensions:
- admonition
- admonition

copyright: Copyright &copy; 2021 <a href="https://github.com/happy2048">Junfeng Yang</a>, Maintained by the Arena Team.
copyright: Copyright &copy; 2024. Maintained by the Arena Team.

plugins:
- search
- search

0 comments on commit 8739eb5

Please sign in to comment.