Skip to content

Commit 3d0c97d

Browse files
committed
Add quantize support for Falcon 180B models
1 parent 0f89d32 commit 3d0c97d

File tree

2 files changed

+10
-1
lines changed

2 files changed

+10
-1
lines changed

rebuild_llama.cpp.ps1

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -95,6 +95,15 @@ git submodule update --remote --merge --force
9595
# of the repository to enable quick debugging.
9696
git -C ./vendor/llama.cpp checkout $version
9797

98+
# Until https://github.com/ggerganov/llama.cpp/pull/3049 is resolved,
99+
# we download the working Falcon 180B convert script (pinned to a fixed commit) into the vendored checkout, skipping the download if the file already exists.
100+
if (-not(Test-Path -Path "./vendor/llama.cpp/convert-falcon180-hf-to-gguf.py")) {
101+
102+
Invoke-WebRequest `
103+
-Uri "https://raw.githubusercontent.com/ggerganov/llama.cpp/3a26b3c310ad210d21684f0e222505939eb34259/convert-falcon180-hf-to-gguf.py" `
104+
-OutFile "./vendor/llama.cpp/convert-falcon180-hf-to-gguf.py"
105+
}
106+
98107
$lines = @(
99108
"# This is a workaround for a CMake bug on Windows to build llama.cpp"
100109
"# with OpenBLAS. The find_package(BLAS) call fails to find OpenBLAS,"

vendor/llama.cpp

0 commit comments

Comments
 (0)