Skip to content

Commit 8a05e34

Browse files
authored
Merge branch 'master' into fix-2638
2 parents 2007bc0 + a0163da commit 8a05e34

Some content is hidden

Large commits have some content hidden by default. Use the search box below for content that may be hidden.

50 files changed

+235
-171
lines changed

.github/workflows/image-pr.yml

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -128,3 +128,12 @@ jobs:
128128
runs-on: 'ubuntu-latest'
129129
base-image: "ubuntu:22.04"
130130
makeflags: "--jobs=4 --output-sync=target"
131+
- build-type: 'vulkan'
132+
platforms: 'linux/amd64'
133+
tag-latest: 'false'
134+
tag-suffix: '-vulkan-ffmpeg-core'
135+
ffmpeg: 'true'
136+
image-type: 'core'
137+
runs-on: 'ubuntu-latest'
138+
base-image: "ubuntu:22.04"
139+
makeflags: "--jobs=4 --output-sync=target"

.github/workflows/image.yml

Lines changed: 10 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -39,7 +39,7 @@ jobs:
3939
strategy:
4040
# Pushing with all jobs in parallel
4141
# eats the bandwidth of all the nodes
42-
# max-parallel: ${{ github.event_name != 'pull_request' && 4 || 8 }}
42+
max-parallel: ${{ github.event_name != 'pull_request' && 6 || 12 }}
4343
matrix:
4444
include:
4545
# Extra images
@@ -315,3 +315,12 @@ jobs:
315315
runs-on: 'arc-runner-set'
316316
base-image: "ubuntu:22.04"
317317
makeflags: "--jobs=4 --output-sync=target"
318+
- build-type: 'vulkan'
319+
platforms: 'linux/amd64,linux/arm64'
320+
tag-latest: 'false'
321+
tag-suffix: '-vulkan-ffmpeg-core'
322+
ffmpeg: 'true'
323+
image-type: 'core'
324+
runs-on: 'arc-runner-set'
325+
base-image: "ubuntu:22.04"
326+
makeflags: "--jobs=4 --output-sync=target"

Dockerfile

Lines changed: 16 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -103,6 +103,22 @@ ARG CUDA_MINOR_VERSION=5
103103

104104
ENV BUILD_TYPE=${BUILD_TYPE}
105105

106+
# Vulkan requirements
107+
RUN <<EOT bash
108+
if [ "${BUILD_TYPE}" = "vulkan" ]; then
109+
apt-get update && \
110+
apt-get install -y --no-install-recommends \
111+
software-properties-common pciutils wget gpg-agent && \
112+
wget -qO - https://packages.lunarg.com/lunarg-signing-key-pub.asc | apt-key add - && \
113+
wget -qO /etc/apt/sources.list.d/lunarg-vulkan-jammy.list https://packages.lunarg.com/vulkan/lunarg-vulkan-jammy.list && \
114+
apt-get update && \
115+
apt-get install -y \
116+
vulkan-sdk && \
117+
apt-get clean && \
118+
rm -rf /var/lib/apt/lists/*
119+
fi
120+
EOT
121+
106122
# CuBLAS requirements
107123
RUN <<EOT bash
108124
if [ "${BUILD_TYPE}" = "cublas" ]; then

Makefile

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@ BINARY_NAME=local-ai
55

66
# llama.cpp versions
77
GOLLAMA_STABLE_VERSION?=2b57a8ae43e4699d3dc5d1496a1ccd42922993be
8-
CPPLLAMA_VERSION?=557b653dc9ed91e8c313e87500e0050c775f81b6
8+
CPPLLAMA_VERSION?=e112b610a1a75cb7fa8351e1a933e2e7a755a5ce
99

1010
# gpt4all version
1111
GPT4ALL_REPO?=https://github.com/nomic-ai/gpt4all
@@ -103,6 +103,10 @@ ifeq ($(BUILD_TYPE),cublas)
103103
CGO_LDFLAGS_WHISPER+=-L$(CUDA_LIBPATH)/stubs/ -lcuda -lcufft
104104
endif
105105

106+
ifeq ($(BUILD_TYPE),vulkan)
107+
CMAKE_ARGS+=-DLLAMA_VULKAN=1
108+
endif
109+
106110
ifeq ($(BUILD_TYPE),hipblas)
107111
ROCM_HOME ?= /opt/rocm
108112
ROCM_PATH ?= /opt/rocm

backend/backend.proto

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -230,6 +230,7 @@ message TranscriptRequest {
230230
string dst = 2;
231231
string language = 3;
232232
uint32 threads = 4;
233+
bool translate = 5;
233234
}
234235

235236
message TranscriptResult {

backend/go/llm/rwkv/rwkv.go

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -31,7 +31,7 @@ func (llm *LLM) Load(opts *pb.ModelOptions) error {
3131
model := rwkv.LoadFiles(opts.ModelFile, tokenizerPath, uint32(opts.GetThreads()))
3232

3333
if model == nil {
34-
return fmt.Errorf("could not load model")
34+
return fmt.Errorf("rwkv could not load model")
3535
}
3636
llm.rwkv = model
3737
return nil

backend/go/transcribe/transcript.go

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -29,7 +29,7 @@ func audioToWav(src, dst string) error {
2929
return nil
3030
}
3131

32-
func Transcript(model whisper.Model, audiopath, language string, threads uint) (schema.TranscriptionResult, error) {
32+
func Transcript(model whisper.Model, audiopath, language string, translate bool, threads uint) (schema.TranscriptionResult, error) {
3333
res := schema.TranscriptionResult{}
3434

3535
dir, err := os.MkdirTemp("", "whisper")
@@ -75,6 +75,10 @@ func Transcript(model whisper.Model, audiopath, language string, threads uint) (
7575
context.SetLanguage("auto")
7676
}
7777

78+
if translate {
79+
context.SetTranslate(true)
80+
}
81+
7882
if err := context.Process(data, nil, nil); err != nil {
7983
return res, err
8084
}

backend/go/transcribe/whisper.go

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -22,5 +22,5 @@ func (sd *Whisper) Load(opts *pb.ModelOptions) error {
2222
}
2323

2424
func (sd *Whisper) AudioTranscription(opts *pb.TranscriptRequest) (schema.TranscriptionResult, error) {
25-
return Transcript(sd.whisper, opts.Dst, opts.Language, uint(opts.Threads))
25+
return Transcript(sd.whisper, opts.Dst, opts.Language, opts.Translate, uint(opts.Threads))
2626
}

core/backend/llm.go

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@ import (
1212
"github.com/mudler/LocalAI/core/config"
1313
"github.com/mudler/LocalAI/core/schema"
1414

15-
"github.com/mudler/LocalAI/pkg/gallery"
15+
"github.com/mudler/LocalAI/core/gallery"
1616
"github.com/mudler/LocalAI/pkg/grpc"
1717
"github.com/mudler/LocalAI/pkg/grpc/proto"
1818
model "github.com/mudler/LocalAI/pkg/model"

core/backend/transcript.go

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@ import (
1111
model "github.com/mudler/LocalAI/pkg/model"
1212
)
1313

14-
func ModelTranscription(audio, language string, ml *model.ModelLoader, backendConfig config.BackendConfig, appConfig *config.ApplicationConfig) (*schema.TranscriptionResult, error) {
14+
func ModelTranscription(audio, language string, translate bool, ml *model.ModelLoader, backendConfig config.BackendConfig, appConfig *config.ApplicationConfig) (*schema.TranscriptionResult, error) {
1515

1616
opts := modelOpts(backendConfig, appConfig, []model.Option{
1717
model.WithBackendString(model.WhisperBackend),
@@ -31,8 +31,9 @@ func ModelTranscription(audio, language string, ml *model.ModelLoader, backendCo
3131
}
3232

3333
return whisperModel.AudioTranscription(context.Background(), &proto.TranscriptRequest{
34-
Dst: audio,
35-
Language: language,
36-
Threads: uint32(*backendConfig.Threads),
34+
Dst: audio,
35+
Language: language,
36+
Translate: translate,
37+
Threads: uint32(*backendConfig.Threads),
3738
})
3839
}

0 commit comments

Comments (0)