.dockerignore
.gitignore
.gitmodules
CMakeLists.txt
Dockerfile
Dockerfile.cuda
LICENSE.md
README.md
mkdocs.yml
poetry.lock
pyproject.toml
setup.py
.github/workflows/build-and-release.yaml
.github/workflows/build-docker.yaml
.github/workflows/publish-to-test.yaml
.github/workflows/publish.yaml
.github/workflows/test.yaml
docs/index.md
examples/high_level_api/fastapi_server.py
examples/high_level_api/high_level_api_embedding.py
examples/high_level_api/high_level_api_inference.py
examples/high_level_api/high_level_api_streaming.py
examples/high_level_api/langchain_custom_llm.py
examples/low_level_api/common.py
examples/low_level_api/low_level_api_chat_cpp.py
examples/low_level_api/low_level_api_llama_cpp.py
examples/low_level_api/quantize.py
examples/notebooks/Clients.ipynb
examples/notebooks/PerformanceTuning.ipynb
llama_cpp/__init__.py
llama_cpp/llama.py
llama_cpp/llama_cpp.py
llama_cpp/llama_types.py
llama_cpp/server/__init__.py
llama_cpp/server/__main__.py
llama_cpp/server/app.py
llama_cpp_python.egg-info/PKG-INFO
llama_cpp_python.egg-info/SOURCES.txt
llama_cpp_python.egg-info/dependency_links.txt
llama_cpp_python.egg-info/requires.txt
llama_cpp_python.egg-info/top_level.txt
tests/test_llama.py
vendor/llama.cpp/.dockerignore
vendor/llama.cpp/.ecrc
vendor/llama.cpp/.editorconfig
vendor/llama.cpp/.gitignore
vendor/llama.cpp/CMakeLists.txt
vendor/llama.cpp/LICENSE
vendor/llama.cpp/Makefile
vendor/llama.cpp/Package.swift
vendor/llama.cpp/README.md
vendor/llama.cpp/SHA256SUMS
vendor/llama.cpp/build.zig
vendor/llama.cpp/convert-lora-to-ggml.py
vendor/llama.cpp/convert-pth-to-ggml.py
vendor/llama.cpp/convert.py
vendor/llama.cpp/flake.lock
vendor/llama.cpp/flake.nix
vendor/llama.cpp/ggml-cuda.cu
vendor/llama.cpp/ggml-cuda.h
vendor/llama.cpp/ggml-opencl.c
vendor/llama.cpp/ggml-opencl.h
vendor/llama.cpp/ggml.c
vendor/llama.cpp/ggml.h
vendor/llama.cpp/llama-util.h
vendor/llama.cpp/llama.cpp
vendor/llama.cpp/llama.h
vendor/llama.cpp/requirements.txt
vendor/llama.cpp/.devops/full.Dockerfile
vendor/llama.cpp/.devops/main.Dockerfile
vendor/llama.cpp/.devops/tools.sh
vendor/llama.cpp/.github/ISSUE_TEMPLATE/custom.md
vendor/llama.cpp/.github/workflows/build.yml
vendor/llama.cpp/.github/workflows/docker.yml
vendor/llama.cpp/.github/workflows/editorconfig.yml
vendor/llama.cpp/examples/CMakeLists.txt
vendor/llama.cpp/examples/Miku.sh
vendor/llama.cpp/examples/alpaca.sh
vendor/llama.cpp/examples/chat-13B.bat
vendor/llama.cpp/examples/chat-13B.sh
vendor/llama.cpp/examples/chat.sh
vendor/llama.cpp/examples/common.cpp
vendor/llama.cpp/examples/common.h
vendor/llama.cpp/examples/gpt4all.sh
vendor/llama.cpp/examples/reason-act.sh
vendor/llama.cpp/examples/benchmark/CMakeLists.txt
vendor/llama.cpp/examples/benchmark/benchmark-matmult.cpp
vendor/llama.cpp/examples/embedding/CMakeLists.txt
vendor/llama.cpp/examples/embedding/README.md
vendor/llama.cpp/examples/embedding/embedding.cpp
vendor/llama.cpp/examples/jeopardy/README.md
vendor/llama.cpp/examples/jeopardy/graph.py
vendor/llama.cpp/examples/jeopardy/jeopardy.sh
vendor/llama.cpp/examples/jeopardy/qasheet.csv
vendor/llama.cpp/examples/jeopardy/questions.txt
vendor/llama.cpp/examples/main/CMakeLists.txt
vendor/llama.cpp/examples/main/README.md
vendor/llama.cpp/examples/main/main.cpp
vendor/llama.cpp/examples/perplexity/CMakeLists.txt
vendor/llama.cpp/examples/perplexity/README.md
vendor/llama.cpp/examples/perplexity/perplexity.cpp
vendor/llama.cpp/examples/quantize/CMakeLists.txt
vendor/llama.cpp/examples/quantize/README.md
vendor/llama.cpp/examples/quantize/quantize.cpp
vendor/llama.cpp/examples/quantize-stats/CMakeLists.txt
vendor/llama.cpp/examples/quantize-stats/quantize-stats.cpp
vendor/llama.cpp/examples/save-load-state/CMakeLists.txt
vendor/llama.cpp/examples/save-load-state/save-load-state.cpp
vendor/llama.cpp/media/llama-leader.jpeg
vendor/llama.cpp/media/llama0-banner.png
vendor/llama.cpp/media/llama0-logo.png
vendor/llama.cpp/media/llama1-banner.png
vendor/llama.cpp/media/llama1-logo.png
vendor/llama.cpp/models/ggml-vocab.bin
vendor/llama.cpp/pocs/CMakeLists.txt
vendor/llama.cpp/pocs/vdot/CMakeLists.txt
vendor/llama.cpp/pocs/vdot/q8dot.cpp
vendor/llama.cpp/pocs/vdot/vdot.cpp
vendor/llama.cpp/prompts/alpaca.txt
vendor/llama.cpp/prompts/chat-with-bob.txt
vendor/llama.cpp/prompts/chat-with-vicuna-v0.txt
vendor/llama.cpp/prompts/chat-with-vicuna-v1.txt
vendor/llama.cpp/prompts/chat.txt
vendor/llama.cpp/prompts/dan.txt
vendor/llama.cpp/prompts/reason-act.txt
vendor/llama.cpp/scripts/build-info.cmake
vendor/llama.cpp/scripts/build-info.h.in
vendor/llama.cpp/scripts/build-info.sh
vendor/llama.cpp/scripts/sync-ggml.sh
vendor/llama.cpp/scripts/verify-checksum-models.py
vendor/llama.cpp/spm-headers/llama.h
vendor/llama.cpp/tests/CMakeLists.txt
vendor/llama.cpp/tests/test-double-float.c
vendor/llama.cpp/tests/test-quantize-fns.cpp
vendor/llama.cpp/tests/test-quantize-perf.cpp
vendor/llama.cpp/tests/test-sampling.cpp
vendor/llama.cpp/tests/test-tokenizer-0.cpp