Commit 89927d4
- .devops/cann.Dockerfile+1
- .devops/cpu.Dockerfile+1
- .devops/cuda.Dockerfile+1
- .devops/intel.Dockerfile+1
- .devops/musa.Dockerfile+1
- .devops/openvino.Dockerfile+1
- .devops/rocm.Dockerfile+1
- .devops/s390x.Dockerfile+6-3
- .devops/vulkan.Dockerfile+1
- .github/ISSUE_TEMPLATE/011-bug-results.yml+2-2
- .github/ISSUE_TEMPLATE/019-bug-misc.yml+2-2
- .github/workflows/build-and-test-snapdragon.yml+2-2
- CMakeLists.txt+14-8
- app/CMakeLists.txt+11
- app/llama.cpp+67
- common/arg.cpp+2-1
- common/common.cpp+2-2
- convert_hf_to_gguf.py+3-3
- docs/backend/snapdragon/CMakeUserPresets.json+4-4
- docs/backend/snapdragon/README.md+1-1
- ggml/src/ggml-cuda/CMakeLists.txt+2-1
- ggml/src/ggml-cuda/binbcast.cu+14-18
- ggml/src/ggml-cuda/common.cuh+86
- ggml/src/ggml-cuda/concat.cu+3-2
- ggml/src/ggml-cuda/cpy.cu+14-6
- ggml/src/ggml-cuda/fattn-common.cuh+18-10
- ggml/src/ggml-cuda/fattn-mma-f16.cuh+1
- ggml/src/ggml-cuda/fattn-tile.cuh+2
- ggml/src/ggml-cuda/fattn-vec.cuh+3
- ggml/src/ggml-cuda/fattn-wmma-f16.cu+1
- ggml/src/ggml-cuda/gated_delta_net.cu+7-4
- ggml/src/ggml-cuda/getrows.cu+6-1
- ggml/src/ggml-cuda/mean.cu+4-2
- ggml/src/ggml-cuda/mmvf.cu+8-4
- ggml/src/ggml-cuda/mmvq.cu+9-4
- ggml/src/ggml-cuda/norm.cu+36-10
- ggml/src/ggml-cuda/quantize.cu+6-1
- ggml/src/ggml-cuda/reduce_rows.cuh+2
- ggml/src/ggml-cuda/rope.cu+11-4
- ggml/src/ggml-cuda/scale.cu+4-1
- ggml/src/ggml-cuda/set-rows.cu+8-3
- ggml/src/ggml-cuda/softcap.cu+4-1
- ggml/src/ggml-cuda/ssm-conv.cu+6-2
- ggml/src/ggml-cuda/ssm-scan.cu+16-11
- ggml/src/ggml-cuda/sumrows.cu+8-4
- ggml/src/ggml-cuda/topk-moe.cu+25-22
- ggml/src/ggml-cuda/unary.cu+8-2
- ggml/src/ggml-hexagon/ggml-hexagon.cpp+3-4
- ggml/src/ggml-hexagon/htp/htp-ops.h+1
- ggml/src/ggml-hexagon/htp/main.c+1
- ggml/src/ggml-hexagon/htp/rope-ops.c+97-18
- ggml/src/ggml-hexagon/htp/unary-ops.c+97
- ggml/src/ggml-metal/ggml-metal-device.cpp+7-1
- ggml/src/ggml-metal/ggml-metal-ops.cpp+11-6
- ggml/src/ggml-metal/ggml-metal.metal+72-56
- ggml/src/ggml-opencl/CMakeLists.txt+6
- ggml/src/ggml-opencl/ggml-opencl.cpp+940-8
- ggml/src/ggml-opencl/kernels/cvt.cl+385
- ggml/src/ggml-opencl/kernels/gemm_moe_q4_k_f32_ns.cl+279
- ggml/src/ggml-opencl/kernels/gemm_moe_q5_k_f32_ns.cl+284
- ggml/src/ggml-opencl/kernels/gemm_moe_q6_k_f32_ns.cl+263
- ggml/src/ggml-opencl/kernels/gemv_moe_q4_k_f32_ns.cl+151
- ggml/src/ggml-opencl/kernels/gemv_moe_q5_k_f32_ns.cl+156
- ggml/src/ggml-opencl/kernels/gemv_moe_q6_k_f32_ns.cl+137
- src/models/delta-net-base.cpp+4-4
- src/models/qwen35.cpp+2-1
- tools/cli/CMakeLists.txt+14-4
- tools/cli/cli.cpp+4-1
- tools/cli/main.cpp+5
- tools/completion/CMakeLists.txt+14-2
- tools/completion/completion.cpp+4-1
- tools/completion/main.cpp+5
- tools/fit-params/fit-params.cpp+1-1
- tools/llama-bench/CMakeLists.txt+14-2
- tools/llama-bench/llama-bench.cpp+4-1
- tools/llama-bench/main.cpp+5
- tools/mtmd/clip.cpp+24-21
- tools/mtmd/clip.h+5-2
- tools/mtmd/mtmd.cpp+101-45
- tools/mtmd/mtmd.h+9
- tools/server/CMakeLists.txt+13-9
- tools/server/main.cpp+5
- tools/server/server-context.cpp+44-12
- tools/server/server.cpp+4-1
- tools/ui/src/lib/components/app/chat/ChatForm/ChatFormActions/ChatFormActionAdd/ChatFormActionsAdd.svelte+1-3
- tools/ui/src/lib/components/app/chat/ChatForm/ChatFormActions/ChatFormActionModels.svelte+1-3
- tools/ui/src/lib/components/app/chat/ChatScreen/ChatScreen.svelte+26-49
- tools/ui/src/lib/components/app/chat/ChatScreen/ChatScreenActionScrollDown.svelte+17-4
- tools/ui/src/lib/components/app/chat/ChatScreen/ChatScreenGreeting.svelte+25
- tools/ui/src/lib/components/app/chat/ChatScreen/ChatScreenProcessingInfo.svelte+14-2
- tools/ui/src/lib/components/app/chat/ChatScreen/ChatScreenServerError.svelte+34
- tools/ui/src/lib/components/app/chat/index.ts+7
- tools/ui/src/lib/components/ui/sidebar/context.svelte.ts+2-4
- tools/ui/src/lib/hooks/is-mobile.svelte.ts-8
- tools/ui/src/lib/services/chat.service.ts+20-20
- tools/ui/src/lib/stores/settings.svelte.ts+2-3
- tools/ui/src/lib/stores/viewport.svelte.ts+9
- tools/ui/src/routes/+layout.svelte+4-4
0 commit comments