Skip to content

Commit b3de159

Browse files
committed
Fixed some GGUFv1 loading bugs, long overdue cleanup for compiling, integrated TTS
tts is functional (+6 squashed commits)
Squashed commits:
[2239631] wip tts
[3a88302] tts not yet working
[0dcfab0e] fix silly bug
[a378d9e] some long overdue cleanup
[fc5a6fb] Wip tts
[39f5049] wip TTS integration
1 parent 12cdcf0 commit b3de159

File tree

17 files changed

+1176
-272
lines changed

17 files changed

+1176
-272
lines changed

CMakeLists.txt

Lines changed: 29 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -495,7 +495,9 @@ add_library(common2
495495
examples/llava/clip.h
496496
src/unicode.h
497497
src/unicode.cpp
498-
src/unicode-data.cpp)
498+
src/unicode-data.cpp
499+
otherarch/utils.cpp
500+
otherarch/utils.h)
499501
target_include_directories(common2 PUBLIC . ./ggml/include ./ggml/src ./ggml/src/ggml-cpu ./include ./otherarch ./otherarch/tools ./otherarch/sdcpp ./otherarch/sdcpp/thirdparty ./examples ./common)
500502
target_compile_features(common2 PUBLIC cxx_std_17) # don't bump
501503
target_link_libraries(common2 PRIVATE ggml ${LLAMA_EXTRA_LIBS})
@@ -515,11 +517,18 @@ target_compile_features(whisper_adapter PUBLIC cxx_std_17) # don't bump
515517
target_link_libraries(whisper_adapter PRIVATE common2 ggml ${LLAMA_EXTRA_LIBS})
516518
set_target_properties(whisper_adapter PROPERTIES POSITION_INDEPENDENT_CODE ON)
517519

520+
add_library(tts_adapter
521+
otherarch/tts_adapter.cpp)
522+
target_include_directories(tts_adapter PUBLIC . ./ggml/include ./ggml/src ./ggml/src/ggml-cpu ./include ./otherarch ./otherarch/tools ./examples ./common)
523+
target_compile_features(tts_adapter PUBLIC cxx_std_17) # don't bump
524+
target_link_libraries(tts_adapter PRIVATE common2 ggml ${LLAMA_EXTRA_LIBS})
525+
set_target_properties(tts_adapter PROPERTIES POSITION_INDEPENDENT_CODE ON)
526+
518527
add_library(gpttype_adapter
519528
gpttype_adapter.cpp)
520529
target_include_directories(gpttype_adapter PUBLIC . ./ggml/include ./ggml/src ./ggml/src/ggml-cpu ./include ./otherarch ./otherarch/tools ./otherarch/sdcpp ./otherarch/sdcpp/thirdparty ./examples ./common)
521530
target_compile_features(gpttype_adapter PUBLIC cxx_std_17) # don't bump
522-
target_link_libraries(gpttype_adapter PRIVATE common2 ggml ${LLAMA_EXTRA_LIBS})
531+
target_link_libraries(gpttype_adapter PRIVATE common2 ggml ggml_v1 ggml_v2 ggml_v3 ${LLAMA_EXTRA_LIBS})
523532
set_target_properties(gpttype_adapter PROPERTIES POSITION_INDEPENDENT_CODE ON)
524533

525534
if (LLAMA_CUBLAS)
@@ -530,8 +539,16 @@ if (LLAMA_CUBLAS)
530539
set_target_properties(${TARGET} PROPERTIES PREFIX "")
531540
set_target_properties(${TARGET} PROPERTIES OUTPUT_NAME "koboldcpp_cublas")
532541
set_target_properties(${TARGET} PROPERTIES POSITION_INDEPENDENT_CODE ON)
533-
target_link_libraries(${TARGET} PUBLIC Threads::Threads ggml ggml_v1 ggml_v2 ggml_v3 common2 gpttype_adapter whisper_adapter sdtype_adapter ${LLAMA_EXTRA_LIBS})
542+
target_link_libraries(${TARGET} PUBLIC Threads::Threads ggml ggml_v1 ggml_v2 ggml_v3 common2 gpttype_adapter whisper_adapter tts_adapter sdtype_adapter ${LLAMA_EXTRA_LIBS})
534543
target_compile_features(${TARGET} PRIVATE cxx_std_17)
544+
545+
add_custom_command(
546+
TARGET koboldcpp_cublas POST_BUILD
547+
COMMAND ${CMAKE_COMMAND} -E copy
548+
$<TARGET_FILE:koboldcpp_cublas> # The generated DLL
549+
${CMAKE_SOURCE_DIR}/ # Destination directory
550+
COMMENT "Copying DLL to parent directory"
551+
)
535552
endif()
536553

537554
if (LLAMA_HIPBLAS)
@@ -542,7 +559,15 @@ if (LLAMA_HIPBLAS)
542559
set_target_properties(${TARGET} PROPERTIES PREFIX "")
543560
set_target_properties(${TARGET} PROPERTIES OUTPUT_NAME "koboldcpp_hipblas")
544561
set_target_properties(${TARGET} PROPERTIES POSITION_INDEPENDENT_CODE ON)
545-
target_link_libraries(${TARGET} PUBLIC Threads::Threads ggml ggml_v1 ggml_v2 ggml_v3 common2 gpttype_adapter whisper_adapter sdtype_adapter ${LLAMA_EXTRA_LIBS})
562+
target_link_libraries(${TARGET} PUBLIC Threads::Threads ggml ggml_v1 ggml_v2 ggml_v3 common2 gpttype_adapter whisper_adapter tts_adapter sdtype_adapter ${LLAMA_EXTRA_LIBS})
546563
target_compile_features(${TARGET} PRIVATE cxx_std_17)
564+
565+
add_custom_command(
566+
TARGET koboldcpp_hipblas POST_BUILD
567+
COMMAND ${CMAKE_COMMAND} -E copy
568+
$<TARGET_FILE:koboldcpp_hipblas> # The generated DLL
569+
${CMAKE_SOURCE_DIR}/ # Destination directory
570+
COMMENT "Copying DLL to parent directory"
571+
)
547572
endif()
548573

Makefile

Lines changed: 21 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@
44
.PHONY: finishedmsg
55

66
default: koboldcpp_default koboldcpp_failsafe koboldcpp_noavx2 koboldcpp_clblast koboldcpp_clblast_noavx2 koboldcpp_cublas koboldcpp_hipblas koboldcpp_vulkan koboldcpp_vulkan_noavx2 finishedmsg
7-
tools: quantize_gpt2 quantize_gptj quantize_gguf quantize_neox quantize_mpt quantize_clip whispermain sdmain gguf-split
7+
tools: quantize_gpt2 quantize_gptj quantize_gguf quantize_neox quantize_mpt quantize_clip ttsmain whispermain sdmain gguf-split
88

99
ifndef UNAME_S
1010
UNAME_S := $(shell uname -s)
@@ -90,10 +90,10 @@ endif
9090
CUBLASLD_FLAGS =
9191
CUBLAS_OBJS =
9292

93-
OBJS_FULL += ggml-alloc.o ggml-cpu-traits.o ggml-quants.o ggml-cpu-quants.o ggml-cpu-aarch64.o unicode.o unicode-data.o ggml-threading.o ggml-cpu-cpp.o gguf.o sgemm.o common.o sampling.o
94-
OBJS_SIMPLE += ggml-alloc.o ggml-cpu-traits.o ggml-quants_noavx2.o ggml-cpu-quants_noavx2.o ggml-cpu-aarch64_noavx2.o unicode.o unicode-data.o ggml-threading.o ggml-cpu-cpp.o gguf.o sgemm_noavx2.o common.o sampling.o
95-
OBJS_SIMPLER += ggml-alloc.o ggml-cpu-traits.o ggml-quants_noavx1.o ggml-cpu-quants_noavx1.o ggml-cpu-aarch64_noavx1.o unicode.o unicode-data.o ggml-threading.o ggml-cpu-cpp.o gguf.o sgemm_noavx1.o common.o sampling.o
96-
OBJS_FAILSAFE += ggml-alloc.o ggml-cpu-traits.o ggml-quants_failsafe.o ggml-cpu-quants_failsafe.o ggml-cpu-aarch64_failsafe.o unicode.o unicode-data.o ggml-threading.o ggml-cpu-cpp.o gguf.o sgemm_failsafe.o common.o sampling.o
93+
OBJS_FULL += ggml-alloc.o ggml-cpu-traits.o ggml-quants.o ggml-cpu-quants.o ggml-cpu-aarch64.o unicode.o unicode-data.o ggml-threading.o ggml-cpu-cpp.o gguf.o sgemm.o common.o sampling.o kcpputils.o
94+
OBJS_SIMPLE += ggml-alloc.o ggml-cpu-traits.o ggml-quants_noavx2.o ggml-cpu-quants_noavx2.o ggml-cpu-aarch64_noavx2.o unicode.o unicode-data.o ggml-threading.o ggml-cpu-cpp.o gguf.o sgemm_noavx2.o common.o sampling.o kcpputils.o
95+
OBJS_SIMPLER += ggml-alloc.o ggml-cpu-traits.o ggml-quants_noavx1.o ggml-cpu-quants_noavx1.o ggml-cpu-aarch64_noavx1.o unicode.o unicode-data.o ggml-threading.o ggml-cpu-cpp.o gguf.o sgemm_noavx1.o common.o sampling.o kcpputils.o
96+
OBJS_FAILSAFE += ggml-alloc.o ggml-cpu-traits.o ggml-quants_failsafe.o ggml-cpu-quants_failsafe.o ggml-cpu-aarch64_failsafe.o unicode.o unicode-data.o ggml-threading.o ggml-cpu-cpp.o gguf.o sgemm_failsafe.o common.o sampling.o kcpputils.o
9797

9898
# OS specific
9999
ifeq ($(UNAME_S),Linux)
@@ -539,6 +539,8 @@ ggml-cpu-cpp.o: ggml/src/ggml-cpu/ggml-cpu.cpp ggml/include/ggml.h ggml/src/ggml
539539
$(CXX) $(CXXFLAGS) -c $< -o $@
540540
gguf.o: ggml/src/gguf.cpp ggml/include/gguf.h
541541
$(CXX) $(CXXFLAGS) -c $< -o $@
542+
kcpputils.o: otherarch/utils.cpp otherarch/utils.h
543+
$(CXX) $(CXXFLAGS) -c $< -o $@
542544

543545
#these have special gpu defines
544546
ggml-backend_default.o: ggml/src/ggml-backend.cpp ggml/src/ggml-backend-impl.h ggml/include/ggml.h ggml/include/ggml-backend.h
@@ -639,8 +641,12 @@ whispercpp_default.o: otherarch/whispercpp/whisper_adapter.cpp
639641
whispercpp_cublas.o: otherarch/whispercpp/whisper_adapter.cpp
640642
$(CXX) $(CXXFLAGS) $(CUBLAS_FLAGS) $(HIPFLAGS) -c $< -o $@
641643

644+
#tts objects
645+
tts_default.o: otherarch/tts_adapter.cpp
646+
$(CXX) $(CXXFLAGS) -c $< -o $@
647+
642648
# idiotic "for easier compilation"
643-
GPTTYPE_ADAPTER = gpttype_adapter.cpp otherarch/llama_v2.cpp otherarch/llama_v3.cpp src/llama.cpp src/llama-impl.cpp src/llama-chat.cpp src/llama-mmap.cpp src/llama-context.cpp src/llama-adapter.cpp src/llama-arch.cpp src/llama-batch.cpp src/llama-vocab.cpp src/llama-grammar.cpp src/llama-sampling.cpp src/llama-kv-cache.cpp src/llama-model-loader.cpp src/llama-model.cpp src/llama-quant.cpp src/llama-hparams.cpp otherarch/utils.cpp otherarch/gptj_v1.cpp otherarch/gptj_v2.cpp otherarch/gptj_v3.cpp otherarch/gpt2_v1.cpp otherarch/gpt2_v2.cpp otherarch/gpt2_v3.cpp otherarch/rwkv_v2.cpp otherarch/rwkv_v3.cpp otherarch/neox_v2.cpp otherarch/neox_v3.cpp otherarch/mpt_v3.cpp ggml/include/ggml.h ggml/include/ggml-cpu.h ggml/include/ggml-cuda.h include/llama.h otherarch/llama-util.h
649+
GPTTYPE_ADAPTER = gpttype_adapter.cpp otherarch/llama_v2.cpp otherarch/llama_v3.cpp src/llama.cpp src/llama-impl.cpp src/llama-chat.cpp src/llama-mmap.cpp src/llama-context.cpp src/llama-adapter.cpp src/llama-arch.cpp src/llama-batch.cpp src/llama-vocab.cpp src/llama-grammar.cpp src/llama-sampling.cpp src/llama-kv-cache.cpp src/llama-model-loader.cpp src/llama-model.cpp src/llama-quant.cpp src/llama-hparams.cpp otherarch/gptj_v1.cpp otherarch/gptj_v2.cpp otherarch/gptj_v3.cpp otherarch/gpt2_v1.cpp otherarch/gpt2_v2.cpp otherarch/gpt2_v3.cpp otherarch/rwkv_v2.cpp otherarch/rwkv_v3.cpp otherarch/neox_v2.cpp otherarch/neox_v3.cpp otherarch/mpt_v3.cpp ggml/include/ggml.h ggml/include/ggml-cpu.h ggml/include/ggml-cuda.h include/llama.h otherarch/llama-util.h
644650
gpttype_adapter_failsafe.o: $(GPTTYPE_ADAPTER)
645651
$(CXX) $(CXXFLAGS) $(FAILSAFE_FLAGS) -c $< -o $@
646652
gpttype_adapter.o: $(GPTTYPE_ADAPTER)
@@ -680,30 +686,30 @@ vulkan-shaders-gen: ggml/src/ggml-vulkan/vulkan-shaders/vulkan-shaders-gen.cpp
680686
$(shell) vulkan-shaders-gen --glslc glslc --input-dir ggml/src/ggml-vulkan/vulkan-shaders --target-hpp ggml/src/ggml-vulkan-shaders.hpp --target-cpp ggml/src/ggml-vulkan-shaders.cpp
681687

682688
#generated libraries
683-
koboldcpp_default: ggml.o ggml-cpu.o ggml_v3.o ggml_v2.o ggml_v1.o expose.o gpttype_adapter.o sdcpp_default.o whispercpp_default.o llavaclip_default.o llava.o ggml-backend_default.o ggml-backend-reg_default.o $(OBJS_FULL) $(OBJS)
689+
koboldcpp_default: ggml.o ggml-cpu.o ggml_v3.o ggml_v2.o ggml_v1.o expose.o gpttype_adapter.o sdcpp_default.o whispercpp_default.o tts_default.o llavaclip_default.o llava.o ggml-backend_default.o ggml-backend-reg_default.o $(OBJS_FULL) $(OBJS)
684690
$(DEFAULT_BUILD)
685691

686692
ifdef FAILSAFE_BUILD
687-
koboldcpp_failsafe: ggml_v4_failsafe.o ggml-cpu_v4_failsafe.o ggml_v3_failsafe.o ggml_v2_failsafe.o ggml_v1_failsafe.o expose.o gpttype_adapter_failsafe.o sdcpp_default.o whispercpp_default.o llavaclip_default.o llava.o ggml-backend_default.o ggml-backend-reg_default.o $(OBJS_FAILSAFE) $(OBJS)
693+
koboldcpp_failsafe: ggml_v4_failsafe.o ggml-cpu_v4_failsafe.o ggml_v3_failsafe.o ggml_v2_failsafe.o ggml_v1_failsafe.o expose.o gpttype_adapter_failsafe.o sdcpp_default.o whispercpp_default.o tts_default.o llavaclip_default.o llava.o ggml-backend_default.o ggml-backend-reg_default.o $(OBJS_FAILSAFE) $(OBJS)
688694
$(FAILSAFE_BUILD)
689695
else
690696
koboldcpp_failsafe:
691697
$(DONOTHING)
692698
endif
693699

694700
ifdef NOAVX2_BUILD
695-
koboldcpp_noavx2: ggml_v4_noavx2.o ggml-cpu_v4_noavx2.o ggml_v3_noavx2.o ggml_v2_noavx2.o ggml_v1_failsafe.o expose.o gpttype_adapter_failsafe.o sdcpp_default.o whispercpp_default.o llavaclip_default.o llava.o ggml-backend_default.o ggml-backend-reg_default.o $(OBJS_SIMPLE) $(OBJS)
701+
koboldcpp_noavx2: ggml_v4_noavx2.o ggml-cpu_v4_noavx2.o ggml_v3_noavx2.o ggml_v2_noavx2.o ggml_v1_failsafe.o expose.o gpttype_adapter_failsafe.o sdcpp_default.o whispercpp_default.o tts_default.o llavaclip_default.o llava.o ggml-backend_default.o ggml-backend-reg_default.o $(OBJS_SIMPLE) $(OBJS)
696702
$(NOAVX2_BUILD)
697703
else
698704
koboldcpp_noavx2:
699705
$(DONOTHING)
700706
endif
701707

702708
ifdef CLBLAST_BUILD
703-
koboldcpp_clblast: ggml_v4_clblast.o ggml-cpu_v4_clblast.o ggml_v3_clblast.o ggml_v2_clblast.o ggml_v1.o expose.o gpttype_adapter_clblast.o ggml-opencl.o ggml_v3-opencl.o ggml_v2-opencl.o ggml_v2-opencl-legacy.o sdcpp_default.o whispercpp_default.o llavaclip_default.o llava.o ggml-backend_default.o ggml-backend-reg_default.o $(OBJS_FULL) $(OBJS)
709+
koboldcpp_clblast: ggml_v4_clblast.o ggml-cpu_v4_clblast.o ggml_v3_clblast.o ggml_v2_clblast.o ggml_v1.o expose.o gpttype_adapter_clblast.o ggml-opencl.o ggml_v3-opencl.o ggml_v2-opencl.o ggml_v2-opencl-legacy.o sdcpp_default.o whispercpp_default.o tts_default.o llavaclip_default.o llava.o ggml-backend_default.o ggml-backend-reg_default.o $(OBJS_FULL) $(OBJS)
704710
$(CLBLAST_BUILD)
705711
ifdef NOAVX2_BUILD
706-
koboldcpp_clblast_noavx2: ggml_v4_clblast_noavx2.o ggml-cpu_v4_clblast_noavx2.o ggml_v3_clblast_noavx2.o ggml_v2_clblast_noavx2.o ggml_v1_failsafe.o expose.o gpttype_adapter_clblast_noavx2.o ggml-opencl.o ggml_v3-opencl.o ggml_v2-opencl.o ggml_v2-opencl-legacy.o sdcpp_default.o whispercpp_default.o llavaclip_default.o llava.o ggml-backend_default.o ggml-backend-reg_default.o $(OBJS_SIMPLER) $(OBJS)
712+
koboldcpp_clblast_noavx2: ggml_v4_clblast_noavx2.o ggml-cpu_v4_clblast_noavx2.o ggml_v3_clblast_noavx2.o ggml_v2_clblast_noavx2.o ggml_v1_failsafe.o expose.o gpttype_adapter_clblast_noavx2.o ggml-opencl.o ggml_v3-opencl.o ggml_v2-opencl.o ggml_v2-opencl-legacy.o sdcpp_default.o whispercpp_default.o tts_default.o llavaclip_default.o llava.o ggml-backend_default.o ggml-backend-reg_default.o $(OBJS_SIMPLER) $(OBJS)
707713
$(CLBLAST_BUILD)
708714
else
709715
koboldcpp_clblast_noavx2:
@@ -717,26 +723,26 @@ koboldcpp_clblast_noavx2:
717723
endif
718724

719725
ifdef CUBLAS_BUILD
720-
koboldcpp_cublas: ggml_v4_cublas.o ggml-cpu.o ggml_v3_cublas.o ggml_v2_cublas.o ggml_v1.o expose.o gpttype_adapter_cublas.o sdcpp_cublas.o whispercpp_cublas.o llavaclip_cublas.o llava.o ggml-backend_cublas.o ggml-backend-reg_cublas.o $(CUBLAS_OBJS) $(OBJS_FULL) $(OBJS)
726+
koboldcpp_cublas: ggml_v4_cublas.o ggml-cpu.o ggml_v3_cublas.o ggml_v2_cublas.o ggml_v1.o expose.o gpttype_adapter_cublas.o sdcpp_cublas.o whispercpp_cublas.o tts_default.o llavaclip_cublas.o llava.o ggml-backend_cublas.o ggml-backend-reg_cublas.o $(CUBLAS_OBJS) $(OBJS_FULL) $(OBJS)
721727
$(CUBLAS_BUILD)
722728
else
723729
koboldcpp_cublas:
724730
$(DONOTHING)
725731
endif
726732

727733
ifdef HIPBLAS_BUILD
728-
koboldcpp_hipblas: ggml_v4_cublas.o ggml-cpu.o ggml_v3_cublas.o ggml_v2_cublas.o ggml_v1.o expose.o gpttype_adapter_cublas.o sdcpp_cublas.o whispercpp_cublas.o llavaclip_cublas.o llava.o ggml-backend_cublas.o ggml-backend-reg_cublas.o $(HIP_OBJS) $(OBJS_FULL) $(OBJS)
734+
koboldcpp_hipblas: ggml_v4_cublas.o ggml-cpu.o ggml_v3_cublas.o ggml_v2_cublas.o ggml_v1.o expose.o gpttype_adapter_cublas.o sdcpp_cublas.o whispercpp_cublas.o tts_default.o llavaclip_cublas.o llava.o ggml-backend_cublas.o ggml-backend-reg_cublas.o $(HIP_OBJS) $(OBJS_FULL) $(OBJS)
729735
$(HIPBLAS_BUILD)
730736
else
731737
koboldcpp_hipblas:
732738
$(DONOTHING)
733739
endif
734740

735741
ifdef VULKAN_BUILD
736-
koboldcpp_vulkan: ggml_v4_vulkan.o ggml-cpu.o ggml_v3.o ggml_v2.o ggml_v1.o expose.o gpttype_adapter_vulkan.o ggml-vulkan.o sdcpp_vulkan.o whispercpp_default.o llavaclip_vulkan.o llava.o ggml-backend_vulkan.o ggml-backend-reg_vulkan.o $(OBJS_FULL) $(OBJS)
742+
koboldcpp_vulkan: ggml_v4_vulkan.o ggml-cpu.o ggml_v3.o ggml_v2.o ggml_v1.o expose.o gpttype_adapter_vulkan.o ggml-vulkan.o sdcpp_vulkan.o whispercpp_default.o tts_default.o llavaclip_vulkan.o llava.o ggml-backend_vulkan.o ggml-backend-reg_vulkan.o $(OBJS_FULL) $(OBJS)
737743
$(VULKAN_BUILD)
738744
ifdef NOAVX2_BUILD
739-
koboldcpp_vulkan_noavx2: ggml_v4_vulkan_noavx2.o ggml-cpu_v4_noavx2.o ggml_v3_noavx2.o ggml_v2_noavx2.o ggml_v1_failsafe.o expose.o gpttype_adapter_vulkan_noavx2.o ggml-vulkan.o sdcpp_vulkan.o whispercpp_default.o llavaclip_vulkan.o llava.o ggml-backend_vulkan.o ggml-backend-reg_vulkan.o $(OBJS_SIMPLE) $(OBJS)
745+
koboldcpp_vulkan_noavx2: ggml_v4_vulkan_noavx2.o ggml-cpu_v4_noavx2.o ggml_v3_noavx2.o ggml_v2_noavx2.o ggml_v1_failsafe.o expose.o gpttype_adapter_vulkan_noavx2.o ggml-vulkan.o sdcpp_vulkan.o whispercpp_default.o tts_default.o llavaclip_vulkan.o llava.o ggml-backend_vulkan.o ggml-backend-reg_vulkan.o $(OBJS_SIMPLE) $(OBJS)
740746
$(VULKAN_BUILD)
741747
else
742748
koboldcpp_vulkan_noavx2:

expose.cpp

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -238,6 +238,15 @@ extern "C"
238238
return whispertype_generate(inputs);
239239
}
240240

241+
bool tts_load_model(const tts_load_model_inputs inputs)
242+
{
243+
return ttstype_load_model(inputs);
244+
}
245+
tts_generation_outputs tts_generate(const tts_generation_inputs inputs)
246+
{
247+
return ttstype_generate(inputs);
248+
}
249+
241250
const char * new_token(int idx) {
242251
if (generated_tokens.size() <= idx || idx < 0) return nullptr;
243252

expose.h

Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -139,6 +139,7 @@ struct last_logprobs_outputs {
139139
int count = 0;
140140
logprob_item * logprob_items = nullptr;
141141
};
142+
142143
struct sd_load_model_inputs
143144
{
144145
const char * model_filename = nullptr;
@@ -178,6 +179,7 @@ struct sd_generation_outputs
178179
int status = -1;
179180
const char * data = "";
180181
};
182+
181183
struct whisper_load_model_inputs
182184
{
183185
const char * model_filename = nullptr;
@@ -201,6 +203,30 @@ struct whisper_generation_outputs
201203
const char * text = "";
202204
};
203205

206+
struct tts_load_model_inputs
207+
{
208+
const char * ttc_model_filename = nullptr;
209+
const char * cts_model_filename = nullptr;
210+
const char * executable_path = nullptr;
211+
const int clblast_info = 0;
212+
const int cublas_info = 0;
213+
const char * vulkan_info = nullptr;
214+
const int gpulayers = 0;
215+
const int debugmode = 0;
216+
};
217+
struct tts_generation_inputs
218+
{
219+
const char * prompt = nullptr;
220+
const int speaker_seed = 0;
221+
const int audio_seed = 0;
222+
const bool quiet = false;
223+
};
224+
struct tts_generation_outputs
225+
{
226+
int status = -1;
227+
const char * data = "";
228+
};
229+
204230
extern std::string executable_path;
205231
extern std::string lora_filename;
206232
extern std::string lora_base;

ggml/src/gguf.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -383,7 +383,7 @@ struct gguf_context * gguf_init_from_file_impl(FILE * file, struct gguf_init_par
383383
}
384384

385385
if (ok && gr.read(n_kv_32)) {
386-
n_kv_32 = n_kv_32;
386+
n_kv = n_kv_32;
387387
} else {
388388
ok = false;
389389
}

0 commit comments

Comments
 (0)