Distribute and run LLMs with a single file.
627 matches across 12 categories. Click a row to expand file-level details.
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | diffusionfile/diffusionfile.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llama.cpp.patches/fetch-ui-assets.sh | 1 | #!/bin/bash |
| LOW | llama.cpp.patches/renames.sh | 1 | #!/usr/bin/env bash |
| LOW | tests/fa_helpers_test.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | tests/fa_helpers_test.cpp | 21 | // These tests compare our AVX-512-optimized llamafile_fa_* helpers |
| LOW | tests/fa_helpers_test.cpp | 41 | #include <vector> |
| LOW | tests/extract_data_uris_test.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | tests/integration/run_tests.sh | 1 | #!/bin/bash |
| LOW | tests/sgemm/iqk_legacy_test.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | tests/sgemm/sgemm_test_utils.h | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | tests/sgemm/sgemm_test_utils.h | 201 | |
| LOW | tests/sgemm/sgemm_vecdot_test.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | tests/sgemm/sgemm_vecdot_test.cpp | 21 | // ============================================================================ |
| LOW | tests/sgemm/sgemm_vecdot_test.cpp | 41 | // - Both implementations tend to perform similarly here since memory is |
| LOW | tests/sgemm/sgemm_vecdot_test.cpp | 61 | // - Lower is better |
| LOW | tests/sgemm/sgemm_matmul_test.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | tests/sgemm/sgemm_matmul_test.cpp | 21 | // ============================================================================ |
| LOW | tests/sgemm/sgemm_matmul_test.cpp | 41 | // |
| LOW | tests/sgemm/sgemm_matmul_test.cpp | 61 | // Accuracy (ULP = Units in Last Place): |
| LOW | tests/sgemm/q8_0_layout_test.cpp | 1 | // q8_0_layout_test: Diagnostic for block_q8_0 vs block_q8_0_x4 memory layout |
| LOW | tests/sgemm/sgemm_sss_test.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | tests/sgemm/sgemm_sss_test.cpp | 21 | // ============================================================================ |
| LOW | tests/sgemm/sgemm_sss_test.cpp | 41 | // - Single-precision accumulation |
| LOW | tests/sgemm/sgemm_sss_test.cpp | 61 | // - "ulp average": Mean ULP difference across all output elements |
| LOW | tests/sgemm/iqk_test.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | tests/sgemm/iqk_test.cpp | 21 | // ============================================================================ |
| LOW | tests/sgemm/iqk_test.cpp | 41 | // - Prompt processing involves large matrix multiplications with these types |
| LOW | tests/sgemm/iqk_test.cpp | 61 | // METRICS: |
| LOW | tests/sgemm/iqk_test.cpp | 81 | #include "ggml.h" |
| LOW | tests/strsm/build_and_run.sh | 1 | #!/bin/bash |
| LOW | llamafile/tinyblas_cpu_sgemm_amd_fma.cpp | 1 | #ifdef __x86_64__ |
| LOW | llamafile/cuda.sh | 1 | #!/bin/bash |
| LOW | llamafile/cuda.sh | 21 | # |
| LOW | llamafile/tinyblas_cpu_sgemm_amd_avx2.cpp | 1 | #ifdef __x86_64__ |
| LOW | llamafile/tinyblas_cpu_mixmul_amd_avx2.cpp | 1 | #ifdef __x86_64__ |
| LOW | llamafile/chatbot_file.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llamafile/version.h | 1 | // -*- mode:c;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llamafile/version.h | 21 | #define LLAMAFILE_MAJOR 0 |
| LOW | llamafile/xterm.h | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llamafile/args.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llamafile/tinyblas_cpu_mixmul_amd_avx512f.cpp | 1 | #ifdef __x86_64__ |
| LOW | llamafile/image.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llamafile/tinyblas_cpu_mixmul_amd_fma.cpp | 1 | #ifdef __x86_64__ |
| LOW | llamafile/datauri.h | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llamafile/llama.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llamafile/zip.c | 1 | // -*- mode:c;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llamafile/fa_helpers_amd_avx512f.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llamafile/chatbot_comm.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llamafile/cuda.c | 1 | // -*- mode:c;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llamafile/cuda.c | 21 | // |
| LOW | llamafile/cuda.c | 41 | #include <sys/stat.h> |
| LOW | llamafile/chatbot_hist.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llamafile/compute.h | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llamafile/tinyblas_cpu_unsupported.cpp | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llamafile/tinyblas-compat.h | 1 | // -*- mode:c++;indent-tabs-mode:nil;c-basic-offset:4;coding:utf-8 -*- |
| LOW | llamafile/tinyblas-compat.h | 21 | // |
| LOW | llamafile/tinyblas-compat.h | 41 | |
| LOW | llamafile/tinyblas-compat.h | 61 | #define cublasSgemmStridedBatched tinyblasSgemmStridedBatched |
| LOW | llamafile/tinyblas-compat.h | 81 | #define CUBLAS_STATUS_INVALID_VALUE TINYBLAS_STATUS_INVALID_VALUE |
| LOW | llamafile/tinyblas-compat.h | 101 | #define CUDA_R_32F TINYBLAS_R_32F |
| 512 more matches not shown… | | | |
| Severity | File | Line | Snippet |
|---|---|---|---|
| HIGH | third_party/mbedtls/error.c | 88 | /* Begin Auto-Generated Code. */ |
| HIGH | third_party/mbedtls/error.c | 422 | /* End Auto-Generated Code. */ |
| HIGH | third_party/mbedtls/error.c | 443 | /* Begin Auto-Generated Code. */ |
| HIGH | third_party/mbedtls/error.c | 634 | /* End Auto-Generated Code. */ |
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | tests/integration/tests/test_tool_calling.py | 88 | def test_tool_call_correct_function(self, llamafile, server_port, timeouts): |
| LOW | tests/integration/tests/test_tool_calling.py | 119 | def test_tool_call_with_arguments(self, llamafile, server_port, timeouts): |
| LOW | tests/integration/tests/test_multimodal.py | 48 | def test_cli_multiple_images_with_markers(self, llamafile, mmproj, test_image, timeouts): |
| LOW | tests/integration/tests/test_multimodal.py | 60 | def test_cli_multiple_images_marker_mismatch(self, llamafile, mmproj, test_image, timeouts): |
| LOW | tests/integration/tests/test_multimodal.py | 124 | def test_server_describe_image(self, llamafile, mmproj, test_image, server_port, timeouts): |
| LOW | tests/integration/tests/test_multimodal.py | 149 | def test_server_image_question(self, llamafile, mmproj, test_image, server_port, timeouts): |
| LOW | tests/integration/tests/test_server.py | 12 | def test_server_starts_and_responds(self, llamafile, server_port, timeouts): |
| LOW | tests/integration/tests/test_server.py | 25 | def test_server_chat_completion(self, llamafile, server_port, timeouts): |
| LOW | tests/integration/tests/test_server.py | 50 | def test_server_chat_completion_math(self, llamafile, server_port, timeouts): |
| LOW | tests/integration/tests/test_server.py | 81 | def test_server_with_temperature_zero(self, llamafile, server_port, timeouts): |
| LOW | tests/integration/tests/test_server.py | 127 | def test_server_with_max_tokens(self, llamafile, server_port, timeouts): |
| LOW | tests/integration/tests/test_combined.py | 14 | def test_combined_server_responds(self, llamafile, server_port, timeouts): |
| LOW | tests/integration/tests/test_combined.py | 36 | def test_combined_tui_and_server_simultaneously(self, llamafile, server_port, timeouts): |
| LOW | tests/integration/tests/test_cli.py | 48 | def test_nothink_removes_thinking(self, llamafile, timeouts): |
| LOW | tests/integration/tests/test_cli.py | 59 | def test_nothink_shorter_output(self, llamafile, timeouts): |
| LOW | tests/integration/tests/test_tui.py | 10 | def test_tui_responds_to_hello(self, llamafile, tmp_path, timeouts): |
| LOW | tests/integration/tests/test_tui.py | 58 | def test_tui_thinking_visible(self, llamafile, tmp_path, timeouts): |
| LOW | tests/integration/utils/llamafile.py | 476 | def chat_completion_streaming( |
| LOW | tests/integration/utils/llamafile.py | 554 | def chat_completion_with_image( |
| Severity | File | Line | Snippet |
|---|---|---|---|
| MEDIUM | llamafile/tinyblas_cpu.h | 25 | // ╚═╝ ╚═╝╚═╝ ╚═╝ ╚══╝ ╚═════╝ ╚═══╝╚═╝ ╚═╝╚═════╝ |
| MEDIUM | scripts/validate_docs.py | 22 | # ── helpers ────────────────────────────────────────────────────────────────── |
| MEDIUM | scripts/validate_docs.py | 32 | # ── 1. .gitbook.yaml ───────────────────────────────────────────────────────── |
| MEDIUM | scripts/validate_docs.py | 61 | # ── 2. SUMMARY.md links ─────────────────────────────────────────────────────── |
| MEDIUM | scripts/validate_docs.py | 89 | # ── 3. Relative links inside markdown files ─────────────────────────────────── |
| MEDIUM | scripts/validate_docs.py | 115 | # ── main ───────────────────────────────────────────────────────────────────── |
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | tools/generate_patches.sh | 103 | # Check if the diff is empty |
| LOW | llama.cpp.patches/apply-patches.sh | 13 | # Check if status is dirty, if so, exit |
| LOW | tests/integration/tests/test_tool_calling.py | 73 | # Check if model made a tool call |
| LOW | whisper.cpp.patches/apply-patches.sh | 13 | # Check if status is dirty, if so, exit |
| LOW | stable-diffusion.cpp.patches/apply-patches.sh | 13 | # Check if status is dirty, if so, exit |
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | tests/integration/run_tests.sh | 4 | # Usage: |
| LOW | tests/strsm/build_and_run.sh | 21 | # Usage: |
| LOW | llamafile/cuda.sh | 25 | # Usage: |
| LOW | llamafile/rocm.sh | 25 | # Usage: |
| LOW | llamafile/vulkan.sh | 21 | # Usage: |
| Severity | File | Line | Snippet |
|---|---|---|---|
| MEDIUM | localscore/nvml.cpp | 129 | // TODO we need a more robust way to import symbols and versions. |
| MEDIUM | third_party/stb/stb_vorbis.c | 51 | // 1.10 - 2017-03-03 - more robust seeking; fix negative ilog(); clear error in open_memory |
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | tests/integration/tests/test_gpu.py | 13 | |
| LOW | tests/integration/tests/test_gpu.py | 48 | |
| LOW | tests/integration/utils/llamafile.py | 19 | |
| LOW | tests/integration/utils/llamafile.py | 476 | |
| LOW | scripts/validate_docs.py | 94 | |
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | tests/integration/tests/test_gpu.py | 27 | except Exception: |
| LOW | tests/integration/tests/test_gpu.py | 38 | except Exception: |
| LOW | tests/integration/utils/llamafile.py | 82 | except Exception: |
| LOW | scripts/validate_docs.py | 44 | except Exception: |
| Severity | File | Line | Snippet |
|---|---|---|---|
| MEDIUM | llamafile/build-functions.sh | 22 | # This file contains common functions used by cuda.sh and rocm.sh |
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | scripts/publish_docs.py | 10 | |
| LOW | scripts/validate_docs.py | 14 | |
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | .github/ISSUE_TEMPLATE/07-refactor.yml | 9 | Don't forget to [check for existing refactor issue tickets](https://github.com/Mozilla-Ocho/llamafile/issues?q=i |
| LOW | .github/ISSUE_TEMPLATE/06-refactor.yml | 9 | Don't forget to [check for existing refactor issue tickets](https://github.com/Mozilla-Ocho/llamafile/issues?q=i |