[wip] create a complete document #571

Draft · wants to merge 3 commits into master
2 changes: 2 additions & 0 deletions .gitignore
@@ -35,3 +35,5 @@ zig-cache/
*.sw?

__pycache__/

/docs/.vitepress/cache/
35 changes: 35 additions & 0 deletions docs/.vitepress/config.mts
@@ -0,0 +1,35 @@
import { defineConfig } from 'vitepress'

// https://vitepress.dev/reference/site-config
export default defineConfig({
    title: "ggml",
    description: "Tensor library for machine learning",
    themeConfig: {
        // https://vitepress.dev/reference/default-theme-config
        nav: [
            { text: 'Guide', link: '/guide/get-start' },
            { text: 'Reference', link: '/reference/markdown-examples' }
        ],
        sidebar: {
            '/guide/': [
                {
                    text: 'Introduction',
                    items: [
                        { text: 'Getting Started', link: '/guide/get-start' }
                    ]
                }
            ],
            '/reference/': [
                {
                    text: 'Reference',
                    items: [
                        { text: 'Markdown Examples', link: '/reference/markdown-examples' },
                        { text: 'Runtime API Examples', link: '/reference/api-examples' }
                    ]
                }
            ]
        },

        socialLinks: [
            { icon: 'github', link: 'https://github.com/ggerganov/ggml' }
        ]
    }
})
156 changes: 156 additions & 0 deletions docs/guide/get-start.md
@@ -0,0 +1,156 @@
# Getting Started

## Installation

### Prerequisites

- A compatible operating system (e.g. Linux, macOS, Windows).
- A C++ compiler that supports at least C++11.
- An editor such as [VSCode](https://code.visualstudio.com/).
- CMake, or a compatible build tool, for building the project.
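You can quickly verify that a compiler and CMake are available from a shell (both commands assume the tools are on your `PATH`):

```sh
# print the compiler and CMake versions to confirm they are installed
c++ --version
cmake --version
```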

### Install with CMake

If you don’t already have CMake installed, see the [CMake installation guide](https://cmake.org/resources).

CMake uses a file named `CMakeLists.txt` to configure the build system for a project. You'll use this file to set up your
project and declare a dependency on ggml.

```cmake
cmake_minimum_required(VERSION 3.14)
project(my_project)

# ggml requires at least C++11
set(CMAKE_CXX_STANDARD 11)
set(CMAKE_CXX_STANDARD_REQUIRED ON)

set(GGML_GIT_COMMIT_HASH ef336850d5bfe8237ebca1ec82cdfb97d78baff1)
set(GGML_GIT_URL https://github.com/ggerganov/ggml.git)

include(FetchContent)

FetchContent_Declare(
    ggml
    GIT_REPOSITORY ${GGML_GIT_URL}
    GIT_TAG        ${GGML_GIT_COMMIT_HASH}
)

FetchContent_MakeAvailable(ggml)

# make the ggml headers available to this project
include_directories(${ggml_SOURCE_DIR}/include)
```

The above configuration declares a dependency on ggml that is downloaded from GitHub and pinned to a specific commit at configure time.
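
With `CMakeLists.txt` in place, a standard out-of-source build fetches ggml and compiles the project. The commands below are the usual CMake invocation, run from the project root:

```sh
# configure the build - this step downloads ggml via FetchContent
cmake -B build
# compile everything
cmake --build build
```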

### Git Submodule

Alternatively, you can add ggml as a git submodule of your project. In your project repository, run:

```sh
git submodule add https://github.com/ggerganov/ggml ggml
```
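
After adding the submodule, one way to wire it into a CMake build is with `add_subdirectory`. This is a minimal sketch, assuming the submodule lives in `ggml/` at the repository root:

```cmake
# build the vendored ggml sources as part of this project
add_subdirectory(ggml)

# make the ggml headers visible to targets in this project
include_directories(${CMAKE_CURRENT_SOURCE_DIR}/ggml/include)
```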

## Create and run a binary

With ggml declared as a dependency, you can use ggml code within your own project.

As an example, create a file named `hello_ggml.cpp` in your project directory with the following contents:

```c++
#include <vector>
#include <cstdio>

#include "ggml/ggml.h"
#include "ggml/ggml-alloc.h"
#include "ggml/ggml-backend.h"

const struct ggml_init_params params = {
    /*.mem_size   =*/ ggml_tensor_overhead() * 10240,
    /*.mem_buffer =*/ nullptr,
    /*.no_alloc   =*/ true, // tensor metadata only - data is allocated in backend buffers
};

int main(int argc, char ** argv) {
    // initialize the timer subsystem
    ggml_time_init();
    const auto t_main_start_us = ggml_time_us();

    // create the ggml context that holds the tensor metadata
    const auto ctx = ggml_init(params);

    // create the CPU backend
    const auto backend = ggml_backend_cpu_init();

    // create two 1d input tensors
    const auto tensor_a = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, 1);
    const auto tensor_b = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, 1);

    std::vector<float> tensor_data_a = {1.0};
    std::vector<float> tensor_data_b = {2.0};
    std::vector<float> tensor_data_c;

    const auto tensor_1d_memory_size = ggml_nbytes(tensor_a) + ggml_nbytes(tensor_b);

    // create a backend buffer (can be in host or device memory)
    const auto tensor_1d_buffer = ggml_backend_alloc_buffer(backend, tensor_1d_memory_size + 256);

    // set values
    {
        const auto alloc = ggml_allocr_new_from_buffer(tensor_1d_buffer);

        // this updates the pointers in the tensors to point to the correct location in the buffer
        // this is necessary since the ggml_context has .no_alloc == true
        // note that the buffer can actually be a device buffer, depending on the backend
        ggml_allocr_alloc(alloc, tensor_a);
        ggml_allocr_alloc(alloc, tensor_b);

        // with the CPU backend we could instead set the data pointers directly:
        //   tensor_a->data = tensor_data_a.data();
        //   tensor_b->data = tensor_data_b.data();
        ggml_backend_tensor_set(tensor_a, tensor_data_a.data(), 0, ggml_nbytes(tensor_a));
        ggml_backend_tensor_set(tensor_b, tensor_data_b.data(), 0, ggml_nbytes(tensor_b));
        ggml_allocr_free(alloc);
    }

    // compute
    {
        // scratch buffer for intermediate results (generously oversized for this tiny graph)
        const auto compute_tensor_buffer = ggml_backend_alloc_buffer(backend, 656480);
        const auto allocr = ggml_allocr_new_from_buffer(compute_tensor_buffer);
        const auto gf = ggml_new_graph(ctx);

        // build the forward graph: tensor_c = tensor_a + tensor_b
        const auto tensor_c = ggml_add(ctx, tensor_a, tensor_b);
        ggml_build_forward_expand(gf, tensor_c);

        // allocate the graph tensors from the scratch buffer
        ggml_allocr_alloc_graph(allocr, gf);

        if (ggml_backend_is_cpu(backend)) {
            ggml_backend_cpu_set_n_threads(backend, 1);
        }

        ggml_backend_graph_compute(backend, gf);

        // read the result back from the backend buffer
        tensor_data_c.resize(1);
        ggml_backend_tensor_get(gf->nodes[gf->n_nodes - 1], tensor_data_c.data(), 0,
                                tensor_data_c.size() * sizeof(float));
        printf("result is = [");
        for (auto i = tensor_data_c.begin(); i != tensor_data_c.end(); ++i) {
            printf("%f ", *i);
        }
        printf("]\n");

        ggml_allocr_free(allocr);
        ggml_backend_buffer_free(compute_tensor_buffer);
    }

    const auto t_main_end_us = ggml_time_us();

    printf("total time = %8.2f ms\n", (t_main_end_us - t_main_start_us) / 1000.0f);

    ggml_free(ctx);
    ggml_backend_buffer_free(tensor_1d_buffer);
    ggml_backend_free(backend);
}
```

When you build and run the program, the result is 3.000000:
```sh
result is = [3.000000]
total time = 10.93 ms
Process finished with exit code 0
```
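
To build the example with the FetchContent setup shown earlier, you can add an executable target and link it against ggml's library target. This is a minimal sketch; it assumes the `ggml` target exported by ggml's own CMakeLists.txt:

```cmake
# example executable that links against the ggml library target
add_executable(hello_ggml hello_ggml.cpp)
target_link_libraries(hello_ggml PRIVATE ggml)
```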

28 changes: 28 additions & 0 deletions docs/index.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,28 @@
---
# https://vitepress.dev/reference/default-theme-home-page
layout: home

hero:
  name: "ggml"
  text: "Tensor library for machine learning"
  tagline: ggml is a tensor library for machine learning that enables large models and high performance on commodity hardware. It is used by llama.cpp and whisper.cpp.
  actions:
    - theme: brand
      text: Get Started
      link: /guide/get-start
    - theme: alt
      text: API Examples
      link: /reference/api-examples

features:
  - title: Written in C
  - title: 16-bit float support
  - title: Integer quantization support (4-bit, 5-bit, 8-bit, etc.)
  - title: ADAM and L-BFGS optimizers
  - title: Optimized for Apple Silicon
  - title: On x86 architectures utilizes AVX / AVX2 intrinsics
  - title: On ppc64 architectures utilizes VSX intrinsics
  - title: No third-party dependencies
  - title: Zero memory allocations during runtime
---

12 changes: 12 additions & 0 deletions docs/package.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,12 @@
{
  "name": "ggml-document",
  "type": "module",
  "scripts": {
    "docs:dev": "vitepress dev",
    "docs:build": "vitepress build",
    "docs:preview": "vitepress preview"
  },
  "devDependencies": {
    "vitepress": "1.0.0-rc.20"
  }
}
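
With this `package.json`, the documentation site can be previewed locally using npm (this assumes Node.js is installed and the commands are run from the `docs/` directory):

```sh
cd docs
npm install        # install vitepress
npm run docs:dev   # start a local dev server with hot reload
npm run docs:build # build the static site
```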