Merge pull request #176 from kerthcet/cleanup/update-installation

InftyAI-Agent · web-flow · commit f8b1f7c5aa2c · 2024-09-26T19:29:56.000+08:00
Update Revision default to main
diff --git a/api/core/v1alpha1/model_types.go b/api/core/v1alpha1/model_types.go
@@ -46,7 +46,7 @@ type ModelHub struct {
 	// in the near future.
 	Filename *string `json:"filename,omitempty"`
 	// Revision refers to a Git revision id which can be a branch name, a tag, or a commit hash.
-	// Most of the time, you don't need to specify it.
+	// +kubebuilder:default=main
 	// +optional
 	Revision *string `json:"revision,omitempty"`
 }
diff --git a/config/crd/bases/llmaz.io_openmodels.yaml b/config/crd/bases/llmaz.io_openmodels.yaml
@@ -130,9 +130,9 @@ spec:
                         - ModelScope
                         type: string
                       revision:
-                        description: |-
-                          Revision refers to a Git revision id which can be a branch name, a tag, or a commit hash.
-                          Most of the time, you don't need to specify it.
+                        default: main
+                        description: Revision refers to a Git revision id which can
+                          be a branch name, a tag, or a commit hash.
                         type: string
                     type: object
                   uri:
diff --git a/pkg/controller_helper/model_source/modelsource_test.go b/pkg/controller_helper/model_source/modelsource_test.go
@@ -39,7 +39,7 @@ func Test_ModelSourceProvider(t *testing.T) {
 		},
 		{
 			name:          "modelhub with GGUF file",
-			model:         wrapper.MakeModel("test-7b").FamilyName("test").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("Qwen/Qwen2-0.5B-Instruct-GGUF", "qwen2-0_5b-instruct-q5_k_m.gguf").Obj(),
+			model:         wrapper.MakeModel("test-7b").FamilyName("test").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("Qwen/Qwen2-0.5B-Instruct-GGUF", "qwen2-0_5b-instruct-q5_k_m.gguf", "").Obj(),
 			wantModelName: "test-7b",
 			wantModelPath: "/workspace/models/qwen2-0_5b-instruct-q5_k_m.gguf",
 		},
diff --git a/test/e2e/playground_test.go b/test/e2e/playground_test.go
@@ -48,7 +48,7 @@ var _ = ginkgo.Describe("playground e2e tests", func() {
 	})
 
 	ginkgo.It("Deploy a huggingface model with llama.cpp", func() {
-		model := wrapper.MakeModel("qwen2-0-5b-gguf").FamilyName("qwen2").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("Qwen/Qwen2-0.5B-Instruct-GGUF", "qwen2-0_5b-instruct-q5_k_m.gguf").Obj()
+		model := wrapper.MakeModel("qwen2-0-5b-gguf").FamilyName("qwen2").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("Qwen/Qwen2-0.5B-Instruct-GGUF", "qwen2-0_5b-instruct-q5_k_m.gguf", "").Obj()
 		gomega.Expect(k8sClient.Create(ctx, model)).To(gomega.Succeed())
 		defer func() {
 			gomega.Expect(k8sClient.Delete(ctx, model)).To(gomega.Succeed())
@@ -73,7 +73,7 @@ var _ = ginkgo.Describe("playground e2e tests", func() {
 			Request("cpu", "2").Request("memory", "4Gi").Limit("cpu", "4").Limit("memory", "4Gi").Obj()
 		gomega.Expect(k8sClient.Create(ctx, backendRuntime)).To(gomega.Succeed())
 
-		model := wrapper.MakeModel("qwen2-0-5b-gguf").FamilyName("qwen2").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("Qwen/Qwen2-0.5B-Instruct-GGUF", "qwen2-0_5b-instruct-q5_k_m.gguf").Obj()
+		model := wrapper.MakeModel("qwen2-0-5b-gguf").FamilyName("qwen2").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("Qwen/Qwen2-0.5B-Instruct-GGUF", "qwen2-0_5b-instruct-q5_k_m.gguf", "").Obj()
 		gomega.Expect(k8sClient.Create(ctx, model)).To(gomega.Succeed())
 		defer func() {
 			gomega.Expect(k8sClient.Delete(ctx, model)).To(gomega.Succeed())
@@ -92,12 +92,12 @@ var _ = ginkgo.Describe("playground e2e tests", func() {
 	})
 	// TODO: add e2e tests.
 	// ginkgo.It("SpeculativeDecoding with llama.cpp", func() {
-	// 	targetModel := wrapper.MakeModel("llama2-7b-q8-gguf").FamilyName("llama2").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("TheBloke/Llama-2-7B-GGUF", "llama-2-7b.Q8_0.gguf").Obj()
+	// 	targetModel := wrapper.MakeModel("llama2-7b-q8-gguf").FamilyName("llama2").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("TheBloke/Llama-2-7B-GGUF", "llama-2-7b.Q8_0.gguf", "").Obj()
 	// 	gomega.Expect(k8sClient.Create(ctx, targetModel)).To(gomega.Succeed())
 	// 	defer func() {
 	// 		gomega.Expect(k8sClient.Delete(ctx, targetModel)).To(gomega.Succeed())
 	// 	}()
-	// 	draftModel := wrapper.MakeModel("llama2-7b-q2-k-gguf").FamilyName("llama2").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("TheBloke/Llama-2-7B-GGUF", "llama-2-7b.Q2_K.gguf").Obj()
+	// 	draftModel := wrapper.MakeModel("llama2-7b-q2-k-gguf").FamilyName("llama2").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("TheBloke/Llama-2-7B-GGUF", "llama-2-7b.Q2_K.gguf", "").Obj()
 	// 	gomega.Expect(k8sClient.Create(ctx, draftModel)).To(gomega.Succeed())
 	// 	defer func() {
 	// 		gomega.Expect(k8sClient.Delete(ctx, draftModel)).To(gomega.Succeed())
diff --git a/test/integration/controller/inference/playground_test.go b/test/integration/controller/inference/playground_test.go
@@ -57,7 +57,7 @@ var _ = ginkgo.Describe("playground controller test", func() {
 		gomega.Expect(k8sClient.Create(ctx, ns)).To(gomega.Succeed())
 		model = util.MockASampleModel()
 		gomega.Expect(k8sClient.Create(ctx, model)).To(gomega.Succeed())
-		draftModel = wrapper.MakeModel("llama3-2b").FamilyName("llama3").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("meta-llama/Meta-Llama-3-2B", "").Obj()
+		draftModel = wrapper.MakeModel("llama3-2b").FamilyName("llama3").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("meta-llama/Meta-Llama-3-2B", "", "").Obj()
 		gomega.Expect(k8sClient.Create(ctx, draftModel)).To(gomega.Succeed())
 	})
 	ginkgo.AfterEach(func() {
diff --git a/test/integration/webhook/model_test.go b/test/integration/webhook/model_test.go
@@ -52,18 +52,18 @@ var _ = ginkgo.Describe("model default and validation", func() {
 		},
 		ginkgo.Entry("apply model family name", &testDefaultingCase{
 			model: func() *coreapi.OpenModel {
-				return wrapper.MakeModel("llama3-8b").ModelSourceWithModelID("meta-llama/Meta-Llama-3-8B", "").FamilyName("llama3").Obj()
+				return wrapper.MakeModel("llama3-8b").ModelSourceWithModelID("meta-llama/Meta-Llama-3-8B", "", "").FamilyName("llama3").Obj()
 			},
 			wantModel: func() *coreapi.OpenModel {
-				return wrapper.MakeModel("llama3-8b").ModelSourceWithModelID("meta-llama/Meta-Llama-3-8B", "").ModelSourceWithModelHub("Huggingface").FamilyName("llama3").Label(coreapi.ModelFamilyNameLabelKey, "llama3").Obj()
+				return wrapper.MakeModel("llama3-8b").ModelSourceWithModelID("meta-llama/Meta-Llama-3-8B", "", "main").ModelSourceWithModelHub("Huggingface").FamilyName("llama3").Label(coreapi.ModelFamilyNameLabelKey, "llama3").Obj()
 			},
 		}),
 		ginkgo.Entry("apply modelscope model hub name", &testDefaultingCase{
 			model: func() *coreapi.OpenModel {
-				return wrapper.MakeModel("llama3-8b").FamilyName("llama3").ModelSourceWithModelHub("ModelScope").ModelSourceWithModelID("LLM-Research/Meta-Llama-3-8B", "").Obj()
+				return wrapper.MakeModel("llama3-8b").FamilyName("llama3").ModelSourceWithModelHub("ModelScope").ModelSourceWithModelID("LLM-Research/Meta-Llama-3-8B", "", "").Obj()
 			},
 			wantModel: func() *coreapi.OpenModel {
-				return wrapper.MakeModel("llama3-8b").ModelSourceWithModelID("LLM-Research/Meta-Llama-3-8B", "").ModelSourceWithModelHub("ModelScope").FamilyName("llama3").Label(coreapi.ModelFamilyNameLabelKey, "llama3").Obj()
+				return wrapper.MakeModel("llama3-8b").ModelSourceWithModelID("LLM-Research/Meta-Llama-3-8B", "", "main").ModelSourceWithModelHub("ModelScope").FamilyName("llama3").Label(coreapi.ModelFamilyNameLabelKey, "llama3").Obj()
 			},
 		}),
 	)
@@ -83,19 +83,19 @@ var _ = ginkgo.Describe("model default and validation", func() {
 		},
 		ginkgo.Entry("default normal huggingface model creation", &testValidatingCase{
 			model: func() *coreapi.OpenModel {
-				return wrapper.MakeModel("llama3-8b").FamilyName("llama3").ModelSourceWithModelID("meta-llama/Meta-Llama-3-8B", "").Obj()
+				return wrapper.MakeModel("llama3-8b").FamilyName("llama3").ModelSourceWithModelID("meta-llama/Meta-Llama-3-8B", "", "").Obj()
 			},
 			failed: false,
 		}),
 		ginkgo.Entry("normal modelScope model creation", &testValidatingCase{
 			model: func() *coreapi.OpenModel {
-				return wrapper.MakeModel("llama3-8b").FamilyName("llama3").ModelSourceWithModelHub("ModelScope").ModelSourceWithModelID("LLM-Research/Meta-Llama-3-8B", "").Obj()
+				return wrapper.MakeModel("llama3-8b").FamilyName("llama3").ModelSourceWithModelHub("ModelScope").ModelSourceWithModelID("LLM-Research/Meta-Llama-3-8B", "", "").Obj()
 			},
 			failed: false,
 		}),
 		ginkgo.Entry("invalid model name", &testValidatingCase{
 			model: func() *coreapi.OpenModel {
-				return wrapper.MakeModel("qwen-2-0.5b").FamilyName("qwen2").ModelSourceWithModelID("Qwen/Qwen2-0.5B-Instruct", "").Obj()
+				return wrapper.MakeModel("qwen-2-0.5b").FamilyName("qwen2").ModelSourceWithModelID("Qwen/Qwen2-0.5B-Instruct", "", "").Obj()
 			},
 			failed: true,
 		}),
@@ -131,13 +131,13 @@ var _ = ginkgo.Describe("model default and validation", func() {
 		}),
 		ginkgo.Entry("set filename when modelHub is Huggingface", &testValidatingCase{
 			model: func() *coreapi.OpenModel {
-				return wrapper.MakeModel("llama3-8b").ModelSourceWithModelID("Qwen/Qwen2-0.5B-Instruct-GGUF", "qwen2-0_5b-instruct-q5_k_m.gguf").FamilyName("llama3").Obj()
+				return wrapper.MakeModel("llama3-8b").ModelSourceWithModelID("Qwen/Qwen2-0.5B-Instruct-GGUF", "qwen2-0_5b-instruct-q5_k_m.gguf", "").FamilyName("llama3").Obj()
 			},
 			failed: false,
 		}),
 		ginkgo.Entry("set filename when modelHub is ModelScope", &testValidatingCase{
 			model: func() *coreapi.OpenModel {
-				return wrapper.MakeModel("llama3-8b").ModelSourceWithModelHub("ModelScope").ModelSourceWithModelID("Qwen/Qwen2-0.5B-Instruct-GGUF", "qwen2-0_5b-instruct-q5_k_m.gguf").FamilyName("llama3").Obj()
+				return wrapper.MakeModel("llama3-8b").ModelSourceWithModelHub("ModelScope").ModelSourceWithModelID("Qwen/Qwen2-0.5B-Instruct-GGUF", "qwen2-0_5b-instruct-q5_k_m.gguf", "").FamilyName("llama3").Obj()
 			},
 			failed: true,
 		}),
diff --git a/test/util/mock.go b/test/util/mock.go
@@ -26,7 +26,7 @@ const (
 )
 
 func MockASampleModel() *coreapi.OpenModel {
-	return wrapper.MakeModel(sampleModelName).FamilyName("llama3").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("meta-llama/Meta-Llama-3-8B", "").Obj()
+	return wrapper.MakeModel(sampleModelName).FamilyName("llama3").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("meta-llama/Meta-Llama-3-8B", "", "").Obj()
 }
 
 func MockASamplePlayground(ns string) *inferenceapi.Playground {
diff --git a/test/util/wrapper/model.go b/test/util/wrapper/model.go
@@ -47,7 +47,7 @@ func (w *ModelWrapper) FamilyName(name string) *ModelWrapper {
 	return w
 }
 
-func (w *ModelWrapper) ModelSourceWithModelID(modelID string, filename string) *ModelWrapper {
+func (w *ModelWrapper) ModelSourceWithModelID(modelID string, filename string, revision string) *ModelWrapper {
 	if modelID != "" {
 		if w.Spec.Source.ModelHub == nil {
 			w.Spec.Source.ModelHub = &coreapi.ModelHub{}
@@ -57,6 +57,10 @@ func (w *ModelWrapper) ModelSourceWithModelID(modelID string, filename string) *
 		if filename != "" {
 			w.Spec.Source.ModelHub.Filename = &filename
 		}
+
+		if revision != "" {
+			w.Spec.Source.ModelHub.Revision = &revision
+		}
 	}
 	return w
 }

Original file line number	Diff line number	Diff line change
`@@ -46,7 +46,7 @@ type ModelHub struct {`
`46`	`46`	`// in the near future.`
`47`	`47`	Filename *string `json:"filename,omitempty"`
`48`	`48`	`// Revision refers to a Git revision id which can be a branch name, a tag, or a commit hash.`
`49`		`- // Most of the time, you don't need to specify it.`
	`49`	`+ // +kubebuilder:default=main`
`50`	`50`	`// +optional`
`51`	`51`	Revision *string `json:"revision,omitempty"`
`52`	`52`	`}`
Original file line number	Diff line number	Diff line change
`@@ -39,7 +39,7 @@ func Test_ModelSourceProvider(t *testing.T) {`
`39`	`39`	`},`
`40`	`40`	`{`
`41`	`41`	`name: "modelhub with GGUF file",`
`42`		`- model: wrapper.MakeModel("test-7b").FamilyName("test").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("Qwen/Qwen2-0.5B-Instruct-GGUF", "qwen2-0_5b-instruct-q5_k_m.gguf").Obj(),`
	`42`	`+ model: wrapper.MakeModel("test-7b").FamilyName("test").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("Qwen/Qwen2-0.5B-Instruct-GGUF", "qwen2-0_5b-instruct-q5_k_m.gguf", "").Obj(),`
`43`	`43`	`wantModelName: "test-7b",`
`44`	`44`	`wantModelPath: "/workspace/models/qwen2-0_5b-instruct-q5_k_m.gguf",`
`45`	`45`	`},`
Original file line number	Diff line number	Diff line change
`@@ -26,7 +26,7 @@ const (`
`26`	`26`	`)`
`27`	`27`
`28`	`28`	`func MockASampleModel() *coreapi.OpenModel {`
`29`		`- return wrapper.MakeModel(sampleModelName).FamilyName("llama3").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("meta-llama/Meta-Llama-3-8B", "").Obj()`
	`29`	`+ return wrapper.MakeModel(sampleModelName).FamilyName("llama3").ModelSourceWithModelHub("Huggingface").ModelSourceWithModelID("meta-llama/Meta-Llama-3-8B", "", "").Obj()`
`30`	`30`	`}`
`31`	`31`
`32`	`32`	`func MockASamplePlayground(ns string) *inferenceapi.Playground {`
Original file line number	Diff line number	Diff line change
`@@ -47,7 +47,7 @@ func (w *ModelWrapper) FamilyName(name string) *ModelWrapper {`
`47`	`47`	`return w`
`48`	`48`	`}`
`49`	`49`
`50`		`-func (w *ModelWrapper) ModelSourceWithModelID(modelID string, filename string) *ModelWrapper {`
	`50`	`+func (w *ModelWrapper) ModelSourceWithModelID(modelID string, filename string, revision string) *ModelWrapper {`
`51`	`51`	`if modelID != "" {`
`52`	`52`	`if w.Spec.Source.ModelHub == nil {`
`53`	`53`	`w.Spec.Source.ModelHub = &coreapi.ModelHub{}`
`@@ -57,6 +57,10 @@ func (w *ModelWrapper) ModelSourceWithModelID(modelID string, filename string) *`
`57`	`57`	`if filename != "" {`
`58`	`58`	`w.Spec.Source.ModelHub.Filename = &filename`
`59`	`59`	`}`
	`60`	`+`
	`61`	`+ if revision != "" {`
	`62`	`+ w.Spec.Source.ModelHub.Revision = &revision`
	`63`	`+ }`
`60`	`64`	`}`
`61`	`65`	`return w`
`62`	`66`	`}`