From ef6806da5186c9edf9473a35f1f2b3884cc8117f Mon Sep 17 00:00:00 2001
From: Ruihang Lai
Date: Sat, 16 Nov 2024 13:29:17 -0500
Subject: [PATCH] [Docs] README revamp and documentation initialization

This PR sets up the XGrammar documentation and reorganizes the README.
---
 .github/workflows/documentation.yaml      |  42 ++++
 README.md                                 | 199 +++++-------------
 docs/.gitignore                           |   1 +
 docs/Makefile                             |  20 ++
 docs/README.md                            |  30 +++
 .../img/mlc-logo-with-text-landscape.svg  |  87 ++++++++
 docs/conf.py                              | 102 +++++++++
 docs/index.rst                            |  32 +++
 docs/make.bat                             |  35 +++
 docs/requirements.txt                     |   8 +
 docs/start/install.rst                    |  95 +++++++++
 docs/start/quick_start.rst                |  35 +++
 docs/tutorials/json_generation.rst        | 199 ++++++++++++++++++
 scripts/build_site.sh                     |  10 +
 scripts/gh_deploy_site.sh                 |  20 ++
 15 files changed, 763 insertions(+), 152 deletions(-)
 create mode 100644 .github/workflows/documentation.yaml
 create mode 100644 docs/.gitignore
 create mode 100644 docs/Makefile
 create mode 100644 docs/README.md
 create mode 100644 docs/_static/img/mlc-logo-with-text-landscape.svg
 create mode 100644 docs/conf.py
 create mode 100644 docs/index.rst
 create mode 100644 docs/make.bat
 create mode 100644 docs/requirements.txt
 create mode 100644 docs/start/install.rst
 create mode 100644 docs/start/quick_start.rst
 create mode 100644 docs/tutorials/json_generation.rst
 create mode 100644 scripts/build_site.sh
 create mode 100644 scripts/gh_deploy_site.sh

diff --git a/.github/workflows/documentation.yaml b/.github/workflows/documentation.yaml
new file mode 100644
index 0000000..9c5e1ce
--- /dev/null
+++ b/.github/workflows/documentation.yaml
@@ -0,0 +1,42 @@
+name: Build Docs
+
+on:
+  push:
+    branches:
+      - main
+  pull_request:
+    branches:
+      - main
+
+jobs:
+  deploy_docs:
+    name: Deploy Docs
+    runs-on: ubuntu-latest
+
+    steps:
+      - uses: actions/checkout@v2
+        with:
+          submodules: recursive
+
+      - name: Configure build environment
+        run: |
+          sudo apt-get update
+          python -m pip install -U pip wheel
+
+      - name: Set up Ruby
+        uses: ruby/setup-ruby@v1
+        with:
+          ruby-version: '3.0'
+
+      - name: Install dependencies
+        run: |
+          python -m pip install -r docs/requirements.txt
+          gem install jekyll jekyll-remote-theme
+
+      - name: Deploy to GitHub Pages
+        if: github.ref == 'refs/heads/main'
+        run: |
+          git remote set-url origin https://x-access-token:${{ secrets.MLC_GITHUB_TOKEN }}@github.com/$GITHUB_REPOSITORY
+          git config --global user.email "mlc-gh-actions-bot@nomail"
+          git config --global user.name "mlc-gh-actions-bot"
+          ./scripts/gh_deploy_site.sh
diff --git a/README.md b/README.md
index 98d9701..252d1a2 100644
--- a/README.md
+++ b/README.md
@@ -1,152 +1,47 @@
-## XGrammar
-
-Cross-platform Near-zero Overhead Grammar-guided Generation for LLMs
-
-- G1: Universal: support any common tokenizer, and common grammar
-- G2: Efficient: Grammar should not cause additional burden for generation
-- G3: Cross-platform: pure C++ impl, portable for every platform, construct E2E pipeline on every platform
-- G4: Easy to understand and maintain
-
-This project is under active development.
-
-### Compile and Install
-
-```bash
-# install requirements
-sudo apt install cmake
-python3 -m pip install ninja pybind11 torch
-
-# build XGrammar core and Python bindings
-# see scripts/config.cmake for configuration options
-mkdir build
-cd build
-# specify your own CUDA architecture
-cmake .. -G Ninja -DXGRAMMAR_CUDA_ARCHITECTURES=89
-ninja
-
-# install Python package
-cd ../python
-python3 -m pip install .
- -# optional: add the python directory to PATH -echo "export PATH=\$PATH:$(pwd)" >> ~/.bashrc -``` - -### Python Usage Guide - -#### Step 1:Construction of grammar - -```python -from xgrammar import BNFGrammar, BuiltinGrammar -from pydantic import BaseModel - -# Method 1: provide a GBNF grammar string -# For specification, see https://github.com/ggerganov/llama.cpp/blob/master/grammars/README.md -gbnf_grammar = """ -root ::= (expr "=" term "\n")+ -expr ::= term ([-+*/] term)* -term ::= num | "(" expr ")" -num ::= [0-9]+ -""" - -gbnf_grammar = BNFGrammar(gbnf_grammar) - -# Method 2: unconstrained JSON -json_grammar = BuiltinGrammar.json() - -# Method 3: provide a Pydantic model -class Person(BaseModel): - name: str - age: int -json_schema_pydantic = BuiltinGrammar.json_schema(Person) - -# Method 4: provide a JSON schema string -person_schema = { - "title": "Person", - "type": "object", - "properties": { - "name": { - "type": "string" - }, - "age": { - "type": "integer", - } - }, - "required": ["name", "age"] -} -json_schema_str = BuiltinGrammar.json_schema(json.dumps(person_schema)) -``` - -#### Step 2: Compiling grammars -The compilation is multi-threaded and cached for every grammar. - -```python -from xgrammar import TokenizerInfo, CachedGrammarCompiler, CompiledGrammar, GrammarMatcher -from transformers import AutoTokenizer - -# 1. Convert huggingface tokenizer to TokenizerInfo (once per model) -tokenizer = AutoTokenizer.from_pretrained("meta-llama/Meta-Llama-3-8B-Instruct") -tokenizer_info = TokenizerInfo.from_huggingface(tokenizer) -``` - -Method 1: Use CachedGrammarCompiler to avoid compile grammar multiple times -```python -# 2. Construct CachedGrammarCompiler (once per model) -compiler = CachedGrammarCompiler(tokenizer_info, max_threads=8) - -# 3. Fetch CompiledGrammar and construct GrammarMatcher (once per request) -compiled_grammar = compiler.compile_json_schema(json_schema_str) -matcher = GrammarMatcher(compiled_grammar) -``` - -Method 2: Compile grammar directly -```python -# 2. Construct CompiledGrammar directly (once per grammar) -compiled_grammar = CompiledGrammar(grammar, tokenizer_info, max_threads=8) - -# 3. Construct GrammarMatcher (once per request) -matcher = GrammarMatcher(compiled_grammar) -``` - -#### Step 3: Grammar-guided generation - -For single-batch generation: -```python -import torch - -token_bitmask = GrammarMatcher.allocate_token_bitmask(matcher.vocab_size) -while True: - logits = LLM.inference() # logits is a tensor of shape (vocab_size,) on GPU - matcher.fill_next_token_bitmask(logits, token_bitmask) - GrammarMatcher.apply_token_bitmask_inplace(logits, token_bitmask) - - prob = torch.softmax(logits, dim=-1) # get probability from logits - next_token_id = Sampler.sample(logits) # use your own sampler - - matcher.accept_token(next_token_id) - if matcher.is_terminated(): # or your own termination condition - break -``` - -For multi-batch generation: -```python -import torch - -matchers: List[GrammarMatcher] # The grammar matcher for every request -token_bitmasks = GrammarMatcher.allocate_token_bitmask(matchers[0].vocab_size, batch_size) -while True: - logits = LLM.inference() # logits is a tensor of shape (batch_size, vocab_size) on GPU - # This for loop is parallelizable using threading.Thread. But estimate the overhead in your - # engine. 
- for i in range(len(matchers)): - matchers[i].fill_next_token_bitmask(token_bitmasks, i) - GrammarMatcher.apply_token_bitmask_inplace(logits, token_bitmasks) - - prob = torch.softmax(logits, dim=-1) # get probability from logits - next_token_ids = Sampler.sample(logits) # use your own sampler - - for i in range(len(matchers)): - matchers[i].accept_token(next_token_ids[i]) - if matchers[i].is_terminated(): # or your own termination condition - requests[i].terminate() -``` +
+ +# XGrammar + +[![Documentation](https://img.shields.io/badge/docs-latest-green)](https://xgrammar.mlc.ai/docs/) +[![License](https://img.shields.io/badge/license-apache_2-blue)](https://github.com/mlc-ai/xgrammar/blob/main/LICENSE) + +**Flexible, Portable and Fast Structured Generation** + + +[Get Started](#get-started) | [Documentation](https://xgrammar.mlc.ai/docs/) + +
+
+## Overview
+
+XGrammar is an open-source solution for flexible, portable, and fast structured generation,
+aiming to bring flexible, zero-overhead structured generation everywhere.
+It supports general context-free grammars to enable a broad range of structures,
+with careful system optimizations that bring execution down to tens of microseconds.
+XGrammar features a minimal and portable C++ backend that can be easily integrated into multiple environments and frameworks,
+and is co-designed with the LLM inference engine, enabling it to outperform existing structured-generation
+solutions and to deliver zero-overhead structured generation in LLM inference.
+
+
+
+## Get Started
+
+Please visit our [documentation](https://xgrammar.mlc.ai/docs/) to get started with XGrammar.
+- [Installation](https://xgrammar.mlc.ai/docs/installation)
+- [Quick start](https://xgrammar.mlc.ai/docs/quick_start)
+
+
+
diff --git a/docs/.gitignore b/docs/.gitignore
new file mode 100644
index 0000000..69fa449
--- /dev/null
+++ b/docs/.gitignore
@@ -0,0 +1 @@
+_build/
diff --git a/docs/Makefile b/docs/Makefile
new file mode 100644
index 0000000..3449de1
--- /dev/null
+++ b/docs/Makefile
@@ -0,0 +1,20 @@
+# Minimal makefile for Sphinx documentation
+#
+
+# You can set these variables from the command line, and also
+# from the environment for the first two.
+SPHINXOPTS ?=
+SPHINXBUILD ?= python -m sphinx
+SOURCEDIR = .
+BUILDDIR = _build
+
+# Put it first so that "make" without argument is like "make help".
+help:
+	@$(SPHINXBUILD) -M help "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O)
+
+.PHONY: help Makefile
+
+# Catch-all target: route all unknown targets to Sphinx using the new
+# "make mode" option. $(O) is meant as a shortcut for $(SPHINXOPTS).
+%: Makefile
+	@$(SPHINXBUILD) -M $@ "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O)
diff --git a/docs/README.md b/docs/README.md
new file mode 100644
index 0000000..29aed7f
--- /dev/null
+++ b/docs/README.md
@@ -0,0 +1,30 @@
+# XGrammar Documentation
+
+The documentation is built with [Sphinx](https://www.sphinx-doc.org/en/master/).
+
+## Dependencies
+
+Run the following command in this directory to install dependencies first:
+
+```bash
+pip3 install -r requirements.txt
+```
+
+## Build the Documentation
+
+Then you can build the documentation by running:
+
+```bash
+make html
+```
+
+## View the Documentation
+
+Run the following command to start a simple HTTP server:
+
+```bash
+cd _build/html
+python3 -m http.server
+```
+
+Then you can view the documentation in your browser at `http://localhost:8000` (the port can be customized by appending `-p PORT_NUMBER` to the python command above).
diff --git a/docs/_static/img/mlc-logo-with-text-landscape.svg b/docs/_static/img/mlc-logo-with-text-landscape.svg
new file mode 100644
index 0000000..e122d32
--- /dev/null
+++ b/docs/_static/img/mlc-logo-with-text-landscape.svg
@@ -0,0 +1,87 @@
+[SVG markup omitted: MLC logo with text, landscape layout]
diff --git a/docs/conf.py b/docs/conf.py
new file mode 100644
index 0000000..efc890c
--- /dev/null
+++ b/docs/conf.py
@@ -0,0 +1,102 @@
+# -*- coding: utf-8 -*-
+import os
+import sys
+
+import tlcpack_sphinx_addon
+
+# -- General configuration ------------------------------------------------
+
+sys.path.insert(0, os.path.abspath("../python"))
+sys.path.insert(0, os.path.abspath("../"))
+autodoc_mock_imports = ["torch"]
+
+# General information about the project.
+project = "XGrammar"
+author = "XGrammar Contributors"
+copyright = "2024, %s" % author
+
+# Version information.
+
+version = "0.1.0"
+release = "0.1.0"
+
+extensions = [
+    "sphinx_tabs.tabs",
+    "sphinx_toolbox.collapse",
+    "sphinxcontrib.httpdomain",
+    "sphinx.ext.autodoc",
+    "sphinx.ext.napoleon",
+    "sphinx_reredirects",
+]
+
+redirects = {}
+
+source_suffix = [".rst"]
+
+language = "en"
+
+exclude_patterns = ["_build", "Thumbs.db", ".DS_Store"]
+
+# The name of the Pygments (syntax highlighting) style to use.
+pygments_style = "sphinx"
+
+# A list of ignored prefixes for module index sorting.
+# If true, `todo` and `todoList` produce output, else they produce nothing.
+todo_include_todos = False
+
+# -- Options for HTML output ----------------------------------------------
+
+# The theme is set by the make target
+import sphinx_rtd_theme
+
+html_theme = "sphinx_rtd_theme"
+html_theme_path = [sphinx_rtd_theme.get_html_theme_path()]
+
+templates_path = []
+
+html_static_path = []
+
+footer_copyright = "© 2024 XGrammar"
+footer_note = " "
+
+# html_logo = "_static/img/mlc-logo-with-text-landscape.svg"
+
+html_theme_options = {
+    "logo_only": False,
+}
+
+header_links = [
+    ("Home", "https://xgrammar.mlc.ai/"),
+    ("Github", "https://github.com/mlc-ai/xgrammar"),
+]
+
+header_dropdown = {
+    "name": "Other Resources",
+    "items": [
+        ("MLC Course", "https://mlc.ai/"),
+        ("MLC Blog", "https://blog.mlc.ai/"),
+        ("MLC LLM", "https://llm.mlc.ai/"),
+        ("Web LLM", "https://webllm.mlc.ai/"),
+        ("SGLang", "https://github.com/sgl-project/sglang"),
+    ],
+}
+
+html_context = {
+    "footer_copyright": footer_copyright,
+    "footer_note": footer_note,
+    "header_links": header_links,
+    "header_dropdown": header_dropdown,
+    "display_github": True,
+    "github_user": "mlc-ai",
+    "github_repo": "xgrammar",
+    "github_version": "main/docs/",
+    "theme_vcs_pageview_mode": "edit",
+    # "header_logo": "/path/to/logo",
+    # "header_logo_link": "",
+    # "version_selector": "",
+}
+
+
+# add additional overrides
+templates_path += [tlcpack_sphinx_addon.get_templates_path()]
+html_static_path += [tlcpack_sphinx_addon.get_static_path()]
diff --git a/docs/index.rst b/docs/index.rst
new file mode 100644
index 0000000..daef3a0
--- /dev/null
+++ b/docs/index.rst
@@ -0,0 +1,32 @@
+👋 Welcome to XGrammar
+======================
+
+`GitHub <https://github.com/mlc-ai/xgrammar>`_
+
+
+
+XGrammar is an open-source solution for flexible, portable, and fast structured generation.
+The mission of this project is to bring flexible, zero-overhead structured generation everywhere.
+
+Quick Start
+-----------
+
+Check out :ref:`quick-start` for quick start examples of using XGrammar.
+
+
+.. toctree::
+   :maxdepth: 1
+   :caption: Get Started
+   :hidden:
+
+   start/install.rst
+   start/quick_start.rst
+
+.. toctree::
+   :maxdepth: 1
+   :caption: Tutorials
+   :hidden:
+
+   tutorials/json_generation.rst
+   .. tutorials/backend_integration.rst .. TODO
+   .. tutorials/web_sdk.rst .. TODO
diff --git a/docs/make.bat b/docs/make.bat
new file mode 100644
index 0000000..32bb245
--- /dev/null
+++ b/docs/make.bat
@@ -0,0 +1,35 @@
+@ECHO OFF
+
+pushd %~dp0
+
+REM Command file for Sphinx documentation
+
+if "%SPHINXBUILD%" == "" (
+	set SPHINXBUILD=sphinx-build
+)
+set SOURCEDIR=.
+set BUILDDIR=_build
+
+%SPHINXBUILD% >NUL 2>NUL
+if errorlevel 9009 (
+	echo.
+	echo.The 'sphinx-build' command was not found. Make sure you have Sphinx
+	echo.installed, then set the SPHINXBUILD environment variable to point
+	echo.to the full path of the 'sphinx-build' executable. Alternatively you
+	echo.may add the Sphinx directory to PATH.
+	echo.
+	echo.If you don't have Sphinx installed, grab it from
+	echo.https://www.sphinx-doc.org/
+	exit /b 1
+)
+
+if "%1" == "" goto help
+
+%SPHINXBUILD% -M %1 %SOURCEDIR% %BUILDDIR% %SPHINXOPTS% %O%
+goto end
+
+:help
+%SPHINXBUILD% -M help %SOURCEDIR% %BUILDDIR% %SPHINXOPTS% %O%
+
+:end
+popd
diff --git a/docs/requirements.txt b/docs/requirements.txt
new file mode 100644
index 0000000..2658857
--- /dev/null
+++ b/docs/requirements.txt
@@ -0,0 +1,8 @@
+sphinx-tabs==3.4.1
+sphinx-rtd-theme
+sphinx==5.2.3
+sphinx-toolbox==3.4.0
+tlcpack-sphinx-addon==0.2.2
+sphinxcontrib-httpdomain==1.8.1
+sphinxcontrib-napoleon==0.7
+sphinx-reredirects==0.1.2
diff --git a/docs/start/install.rst b/docs/start/install.rst
new file mode 100644
index 0000000..f69cfd8
--- /dev/null
+++ b/docs/start/install.rst
@@ -0,0 +1,95 @@
+.. _installation:
+
+Installation
+============
+
+.. contents:: Table of Contents
+   :local:
+   :depth: 2
+
+The XGrammar Python package can be installed from a prebuilt developer package,
+or built from source.
+
+
+.. _installation_prebuilt_package:
+
+Option 1. Prebuilt Package
+--------------------------
+
+We provide nightly built pip wheels for XGrammar.
+Run the installation command below in your terminal:
+
+.. note::
+   ❗ Whenever using Python, it is highly recommended to use **conda** to manage an isolated Python environment to avoid missing dependencies, incompatible versions, and package conflicts.
+   Please make sure your conda environment has Python and pip installed.
+
+.. code-block:: bash
+
+   conda activate your-environment
+   # TODO
+   python -m pip install ...
+
+
+.. python -m pip install --pre -U -f https://mlc.ai/wheels mlc-llm-nightly-cpu mlc-ai-nightly-cpu
+
+
+Then you can verify the installation from the command line:
+
+.. code-block:: bash
+
+   python -c "import xgrammar; print(xgrammar)"
+   # Prints out: <module 'xgrammar' from '/path/to/xgrammar/__init__.py'>
+
+|
+
+.. _installation_build_from_source:
+
+Option 2. Build from Source
+---------------------------
+
+We also provide options to build XGrammar from source.
+This step is useful when you want to make modifications to, or obtain a specific version of, XGrammar.
+
+
+**Step 1. Set up build dependencies.** To build from source, you need to ensure that the following build dependencies are satisfied:
+
+* CMake >= 3.18
+* Git
+
+.. code-block:: bash
+
+   # make sure to start with a fresh environment
+   conda env remove -n xgrammar-venv
+   # create the conda environment with build dependencies
+   conda create -n xgrammar-venv -c conda-forge \
+       "cmake>=3.18" \
+       git \
+       python=3.11
+   # enter the build environment
+   conda activate xgrammar-venv
+   # install Python dependencies
+   python3 -m pip install ninja pybind11 torch
+
+
+**Step 2. Configure, build and install.** A standard git-based workflow is recommended to download XGrammar.
+
+.. code-block:: bash
+
+   # 1. clone from GitHub
+   git clone --recursive https://github.com/mlc-ai/xgrammar.git && cd xgrammar
+   # 2. build XGrammar core and Python bindings
+   mkdir build && cd build
+   cmake .. -G Ninja
+   ninja
+   # 3. install the Python package
+   cd ../python
+   python3 -m pip install .
+   # 4. (optional) add the python directory to PYTHONPATH for in-place use
+   echo "export PYTHONPATH=$(pwd):\$PYTHONPATH" >> ~/.bashrc
+
+**Step 3. Validate installation.** You can validate that XGrammar was compiled successfully from the command line.
+The printed path should point to the directory you just built from source:
+
+.. code-block:: bash
+
+   python -c "import xgrammar; print(xgrammar)"
diff --git a/docs/start/quick_start.rst b/docs/start/quick_start.rst
new file mode 100644
index 0000000..dd416c4
--- /dev/null
+++ b/docs/start/quick_start.rst
@@ -0,0 +1,35 @@
+.. _quick-start:
+
+Quick Start
+===========
+
+Example
+-------
+
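+A minimal sketch of grammar-guided generation, assembled from the APIs
+shown in :ref:`tutorial-json-generation` (see the tutorial for the full decoding loop):
+
+.. code-block:: python
+
+   from xgrammar import BuiltinGrammar, CompiledGrammar, GrammarMatcher, TokenizerInfo
+   from transformers import AutoTokenizer
+
+   # Obtain tokenizer information for the target model (once per model).
+   tokenizer = AutoTokenizer.from_pretrained("meta-llama/Meta-Llama-3-8B-Instruct")
+   tokenizer_info = TokenizerInfo.from_huggingface(tokenizer)
+
+   # Compile the builtin JSON grammar and create a matcher for one request.
+   compiled_grammar = CompiledGrammar(BuiltinGrammar.json(), tokenizer_info, max_threads=8)
+   matcher = GrammarMatcher(compiled_grammar)
+
+   # In the decoding loop, fill and apply the token bitmask before sampling.
+   # See :ref:`tutorial-json-generation` for the full decoding loop.
+   token_bitmask = GrammarMatcher.allocate_token_bitmask(matcher.vocab_size)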
+
+
+What to Do Next
+---------------
+
+- Check out :ref:`tutorial-json-generation` for a usage guide of XGrammar.
+- To report a problem or ask a question, open a new issue in our `GitHub repo <https://github.com/mlc-ai/xgrammar>`_.
+
diff --git a/docs/tutorials/json_generation.rst b/docs/tutorials/json_generation.rst
new file mode 100644
index 0000000..bd17b35
--- /dev/null
+++ b/docs/tutorials/json_generation.rst
@@ -0,0 +1,199 @@
+.. _tutorial-json-generation:
+
+JSON Generation
+===============
+
+
+Install XGrammar
+~~~~~~~~~~~~~~~~
+
+:ref:`XGrammar <installation>` is available via pip.
+It is always recommended to install it in an isolated conda virtual environment.
+
+
+.. _tutorial-json-generation-construct-grammar:
+
+Step 1: Construct a grammar
+~~~~~~~~~~~~~~~~~~~~~~~~~~~
+
+XGrammar provides the following methods to flexibly construct a grammar.
+You can construct a grammar from any of these sources.
+
+**Method 1: Construct with a GBNF string.**
+The GBNF (GGML BNF) specification is available
+`here <https://github.com/ggerganov/llama.cpp/blob/master/grammars/README.md>`__.
+
+
+.. code:: python
+
+    from xgrammar import BNFGrammar
+
+    # Method 1: Construct with a GBNF string (a raw string keeps "\n" as a GBNF escape).
+    gbnf_grammar = r"""
+    root ::= (expr "=" term "\n")+
+    expr ::= term ([-+*/] term)*
+    term ::= num | "(" expr ")"
+    num ::= [0-9]+
+    """
+    gbnf_grammar = BNFGrammar(gbnf_grammar)
+
+
+**Method 2: Use the builtin JSON grammar.**
+
+.. code:: python
+
+    from xgrammar import BuiltinGrammar
+
+    # Method 2: Use the builtin JSON grammar.
+    json_grammar = BuiltinGrammar.json()
+
+
+**Method 3: Construct from a Pydantic model.**
+
+.. code:: python
+
+    from xgrammar import BuiltinGrammar
+    from pydantic import BaseModel
+
+    # Method 3: Construct from a Pydantic model.
+    class Person(BaseModel):
+        name: str
+        age: int
+    json_schema_pydantic = BuiltinGrammar.json_schema(Person)
+
+**Method 4: Construct from a JSON schema string.**
+
+.. code:: python
+
+    import json
+    from xgrammar import BuiltinGrammar
+
+    # Method 4: Construct from a JSON schema string.
+    person_schema = {
+        "title": "Person",
+        "type": "object",
+        "properties": {
+            "name": {
+                "type": "string"
+            },
+            "age": {
+                "type": "integer"
+            }
+        },
+        "required": ["name", "age"]
+    }
+    json_schema_str = json.dumps(person_schema)
+    json_schema_grammar = BuiltinGrammar.json_schema(json_schema_str)
+
+.. _tutorial-json-generation-compile-grammar:
+
+Step 2: Compile grammars
+~~~~~~~~~~~~~~~~~~~~~~~~
+
+XGrammar supports multi-threaded grammar compilation.
+In addition, the grammar compiler provides a cache to avoid
+repeatedly compiling the same grammar.
+
+To initialize a grammar compiler, we first need to obtain
+information from the target tokenizer.
+As an example, here we use the Llama-3 model tokenizer.
+
+.. code:: python
+
+    from xgrammar import TokenizerInfo
+    from transformers import AutoTokenizer
+
+    # Obtain XGrammar TokenizerInfo from HuggingFace tokenizer (once per model).
+    tokenizer = AutoTokenizer.from_pretrained("meta-llama/Meta-Llama-3-8B-Instruct")
+    tokenizer_info = TokenizerInfo.from_huggingface(tokenizer)
+
+
+Now we can create a grammar compiler :class:`xgrammar.CachedGrammarCompiler`
+and compile the constructed grammar.
+The compiler caches every compiled grammar, so each grammar is compiled
+at most once.
+
+.. code:: python
+
+    from xgrammar import CachedGrammarCompiler
+
+    # Construct CachedGrammarCompiler.
+    compiler = CachedGrammarCompiler(tokenizer_info, max_threads=8)
+    # Compile the grammar.
+    compiled_grammar = compiler.compile_json_schema(json_schema_str)
+
+
+Alternatively, you can construct a :class:`xgrammar.CompiledGrammar` directly,
+which compiles the grammar once on construction and does not cache it.
+
+.. code:: python
+
+    from xgrammar import CompiledGrammar
+
+    # Construct CompiledGrammar directly from a grammar (no cache).
+    # The grammar is compiled during construction.
+    compiled_grammar = CompiledGrammar(json_schema_grammar, tokenizer_info, max_threads=8)
+
+
+
+.. _tutorial-json-generation-grammar-guided-generation:
+
+Step 3: Grammar-guided generation
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+
+We can now use the compiled grammar in structured generation.
+Below are two pseudocode examples in Python, for
+single-request generation and batch-request generation respectively.
+
+**Single-request generation.**
+
+.. code:: python
+
+    from xgrammar import GrammarMatcher
+    import torch
+
+    # Create a grammar matcher from the compiled grammar.
+    matcher = GrammarMatcher(compiled_grammar)
+
+    token_bitmask = GrammarMatcher.allocate_token_bitmask(matcher.vocab_size)
+    while True:
+        logits = LLM.inference()  # logits is a tensor of shape (vocab_size,) on GPU
+        matcher.fill_next_token_bitmask(token_bitmask)
+        GrammarMatcher.apply_token_bitmask_inplace(logits, token_bitmask)
+
+        prob = torch.softmax(logits, dim=-1)  # get probabilities from logits
+        next_token_id = Sampler.sample(prob)  # use your own sampler
+
+        matcher.accept_token(next_token_id)
+        if matcher.is_terminated():  # or your own termination condition
+            break
+
+
+**Batch-request generation.**
+
+.. code:: python
+
+    from xgrammar import GrammarMatcher
+    import torch
+
+    batch_size = 10
+    # Create a grammar matcher for each request.
+    matchers = [GrammarMatcher(compiled_grammar) for _ in range(batch_size)]
+    token_bitmasks = GrammarMatcher.allocate_token_bitmask(matchers[0].vocab_size, batch_size)
+    while True:
+        logits = LLM.inference()  # logits is a tensor of shape (batch_size, vocab_size) on GPU
+        # This loop can be parallelized with threading.Thread,
+        # but measure the overhead in your engine first.
+        for i in range(batch_size):
+            matchers[i].fill_next_token_bitmask(token_bitmasks, i)
+        GrammarMatcher.apply_token_bitmask_inplace(logits, token_bitmasks)
+
+        prob = torch.softmax(logits, dim=-1)  # get probabilities from logits
+        next_token_ids = Sampler.sample(prob)  # use your own sampler
+
+        for i in range(batch_size):
+            matchers[i].accept_token(next_token_ids[i])
+            if matchers[i].is_terminated():  # or your own termination condition
+                requests[i].terminate()
+
diff --git a/scripts/build_site.sh b/scripts/build_site.sh
new file mode 100644
index 0000000..062f809
--- /dev/null
+++ b/scripts/build_site.sh
@@ -0,0 +1,10 @@
+#!/bin/bash
+set -euxo pipefail
+
+export PYTHONPATH=$PWD/python
+cd docs && make html && cd ..
+
+cd site && jekyll build && cd ..
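+# Copy the freshly built Sphinx HTML into the Jekyll site output.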
+rm -rf site/_site/docs
+cp -r docs/_build/html site/_site/docs
diff --git a/scripts/gh_deploy_site.sh b/scripts/gh_deploy_site.sh
new file mode 100644
index 0000000..1b21c52
--- /dev/null
+++ b/scripts/gh_deploy_site.sh
@@ -0,0 +1,20 @@
+#!/bin/bash
+# NOTE: this script is triggered automatically by GitHub Actions
+# when merged into main
+
+set -euxo pipefail
+
+scripts/build_site.sh
+
+git fetch
+git checkout -B gh-pages origin/gh-pages
+rm -rf docs .gitignore
+mkdir -p docs
+cp -rf site/_site/* docs
+touch docs/.nojekyll
+
+DATE=`date`
+git add docs && git commit -am "Build at ${DATE}"
+git push origin gh-pages
+git checkout main && git submodule update
+echo "Finished deployment at ${DATE}"