quantumaikr
diff --git a/.gitignore b/.gitignore
Lines changed: 3 additions & 1 deletion
diff --git a/CLAUDE.md b/CLAUDE.md
Lines changed: 5 additions & 4 deletions
diff --git a/CMakeLists.txt b/CMakeLists.txt
Lines changed: 2 additions & 2 deletions
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
Lines changed: 8 additions & 8 deletions
diff --git a/Dockerfile b/Dockerfile
Lines changed: 5 additions & 5 deletions
diff --git a/Makefile b/Makefile
Lines changed: 11 additions & 11 deletions
diff --git a/README.ko.md b/README.ko.md
Lines changed: 2 additions & 2 deletions
@@ -46,7 +46,9 @@ models/.claude/worktrees/
 models/
 
 # Makefile build artifacts
-tq_run
+quant
 tq_convert
 libturboquant.a
 *.o
+tq_run
+tq_run.dSYM/
@@ -1,9 +1,10 @@
-# TurboQuant.cpp — Agent Development Guide
+# quant.cpp — Agent Development Guide
 
 ## Project Overview
 
-TurboQuant.cpp is a cross-platform C/C++ library for extreme KV cache compression in LLM inference.
-It implements PolarQuant + QJL (TurboQuant) algorithms to achieve 5x KV cache memory reduction at 3-bit with zero quality loss.
+quant.cpp is a minimal C inference engine for local LLMs with KV cache compression.
+33K LOC, pure C, zero dependencies. Supports 5 architectures via GGUF.
+Killer feature: delta KV compression — 3-bit keys with PPL -3.2% vs FP32.
 
 ## Architecture
 
@@ -196,5 +197,5 @@ When merging worker results back to main:
 ./harness/run.sh --parallel-only
 
 # Manual team spawn
-clawteam launch harness/team.toml --goal "Build TurboQuant.cpp" --workspace
+clawteam launch harness/team.toml --goal "Build quant.cpp" --workspace
 ```
@@ -238,8 +238,8 @@ if(TQ_BUILD_BENCH)
 endif()
 
 # CLI inference tool
-add_executable(tq_run tools/tq_run.c)
-target_link_libraries(tq_run turboquant)
+add_executable(quant tools/quant.c)
+target_link_libraries(quant turboquant)
 
 # Debug comparison tool
 add_executable(debug_compare tools/debug_compare.c)
 
@@ -1,12 +1,12 @@
-# Contributing to TurboQuant.cpp
+# Contributing to quant.cpp
 
 Thank you for your interest in contributing! Here's how to get started.
 
 ## Quick Setup
 
 ```bash
-git clone https://github.com/quantumaikr/TurboQuant.cpp
-cd TurboQuant.cpp
+git clone https://github.com/quantumaikr/quant.cpp
+cd quant.cpp
 cmake -B build -DCMAKE_BUILD_TYPE=Debug -DTQ_BUILD_TESTS=ON
 cmake --build build -j$(nproc 2>/dev/null || sysctl -n hw.ncpu)
 ctest --test-dir build --output-on-failure
@@ -15,8 +15,8 @@ ctest --test-dir build --output-on-failure
 Or with Docker:
 
 ```bash
-docker build -t turboquant .
-docker run turboquant models/model.tqm -p "Hello" -k turbo_kv_1b
+docker build -t quant .
+docker run quant models/model.gguf -p "Hello"
 ```
 
 ## Running Tests
@@ -38,7 +38,7 @@ bash score.sh --quality    # Quantization quality metrics
 
 ## What to Work On
 
-Check [Issues](https://github.com/quantumaikr/TurboQuant.cpp/issues) for tasks labeled `good first issue` or `help wanted`.
+Check [Issues](https://github.com/quantumaikr/quant.cpp/issues) for tasks labeled `good first issue` or `help wanted`.
 
 **High-impact areas:**
 - New model architectures (Llama, Phi, Gemma)
@@ -50,7 +50,7 @@ Check [Issues](https://github.com/quantumaikr/TurboQuant.cpp/issues) for tasks l
 
 1. Add the model config struct to `include/turboquant/tq_engine.h`
 2. Implement the forward pass in `src/engine/` (one file per architecture)
-3. Register the architecture in `tq_load_model()` in `src/engine/tq_model_loader.c`
+3. Register the architecture in `tq_load_model()` in `src/engine/tq_model.c`
 4. Add a test in `tests/` and an example in `examples/`
 5. Verify with `bash score.sh --quick`
 
@@ -61,7 +61,7 @@ Check [Issues](https://github.com/quantumaikr/TurboQuant.cpp/issues) for tasks l
 3. Implement `quantize`/`dequantize`/`attention` in `src/core/tq_<name>.c`
 4. Register in the dispatch table in `src/core/tq_traits.c`
 5. Add unit tests in `tests/test_<name>.cpp`
-6. Update `tools/tq_run.c` to accept the new type name in `parse_kv_type()`
+6. Update `tools/quant.c` to accept the new type name in `parse_kv_type()`
 
 ## Code Standards
 
 
@@ -13,8 +13,8 @@ RUN apt-get update && apt-get install -y --no-install-recommends \
     && rm -rf /var/lib/apt/lists/*
 
 # Copy project source (see .dockerignore for exclusions)
-COPY . /turboquant
-WORKDIR /turboquant
+COPY . /quant
+WORKDIR /quant
 
 # Build the library, tools, and tests
 RUN cmake -B build \
@@ -26,6 +26,6 @@ RUN cmake -B build \
 # Run the test suite
 RUN ctest --test-dir build --output-on-failure
 
-# Default entrypoint: the tq_run inference CLI
-# Usage: docker run turboquant models/model.tqm -p "Hello" -k turbo_kv_1b
-ENTRYPOINT ["./build/tq_run"]
+# Default entrypoint: the quant inference CLI
+# Usage: docker run quant models/model.gguf -p "Hello"
+ENTRYPOINT ["./build/quant"]
@@ -1,16 +1,16 @@
 # TurboQuant.cpp — Standalone Makefile (no CMake needed)
 #
 # Usage:
-#   make              # build tq_run + tq_convert
-#   make tq_run       # inference tool only
+#   make              # build quant + tq_convert
+#   make quant        # inference tool only
 #   make test         # build and run tests (requires Google Test)
 #   make clean        # remove build artifacts
 #
 # Cross-platform:
 #   Linux/gcc:     make CC=gcc
 #   macOS/clang:   make                    (auto-detects Apple Silicon)
 #   macOS+Metal:   make METAL=1            (enables Metal GPU backend)
-#   Windows/mingw: make CC=x86_64-w64-mingw32-gcc TARGET=tq_run.exe
+#   Windows/mingw: make CC=x86_64-w64-mingw32-gcc TARGET=quant.exe
 #
 # Options:
 #   DEBUG=1    — debug build (-g -O0 -fsanitize=address)
@@ -87,14 +87,14 @@ endif
 
 .PHONY: all clean test
 
-all: tq_run tq_convert
+all: quant tq_convert
 
 # Static library
 libturboquant.a: $(OBJ_LIB)
 	$(AR) rcs $@ $^
 
 # Main tools
-tq_run: tools/tq_run.c libturboquant.a
+quant: tools/quant.c libturboquant.a
 	$(CC) $(CFLAGS) -o $@ $< -L. -lturboquant $(LDFLAGS)
 
 tq_convert: tools/tq_convert.c libturboquant.a
@@ -115,12 +115,12 @@ tq_convert: tools/tq_convert.c libturboquant.a
 # Test (lightweight — no Google Test dependency)
 # ============================================================
 
-test: tq_run
+test: quant
 	@echo "=== Quick sanity test ==="
 	@echo "Building..."
-	@echo "Running tq_run --info on test..."
+	@echo "Running quant --info on test..."
 	@if [ -f model.tqm ]; then \
-		./tq_run model.tqm --info && echo "PASS: model loads" || echo "FAIL"; \
+		./quant model.tqm --info && echo "PASS: model loads" || echo "FAIL"; \
 	else \
 		echo "SKIP: no model.tqm found (download a model first)"; \
 	fi
@@ -131,7 +131,7 @@ test: tq_run
 # ============================================================
 
 clean:
-	rm -f $(OBJ_LIB) $(OBJ_METAL) libturboquant.a tq_run tq_convert
+	rm -f $(OBJ_LIB) $(OBJ_METAL) libturboquant.a quant tq_convert
 	rm -f src/**/*.o
 
 # ============================================================
@@ -142,8 +142,8 @@ help:
 	@echo "TurboQuant.cpp Makefile"
 	@echo ""
 	@echo "Targets:"
-	@echo "  make              Build tq_run + tq_convert"
-	@echo "  make tq_run       Build inference tool only"
+	@echo "  make              Build quant + tq_convert"
+	@echo "  make quant       Build inference tool only"
 	@echo "  make clean        Remove build artifacts"
 	@echo "  make test         Quick sanity test"
 	@echo "  make help         Show this help"
 
@@ -63,8 +63,8 @@ cmake -B build -DCMAKE_BUILD_TYPE=Release -DTQ_BUILD_TESTS=ON
 cmake --build build -j$(nproc)
 ctest --test-dir build   # 33/33 통과
 
-./build/tq_run model.gguf -p "Hello" -k uniform_4b -v q4   # 3.8x 압축
-./build/tq_run model.gguf --ppl input.txt -k uniform_4b -v q4  # PPL 측정
+./build/quant model.gguf -p "Hello" -k uniform_4b -v q4   # 3.8x 압축
+./build/quant model.gguf --ppl input.txt -k uniform_4b -v q4  # PPL 측정
 ```
 
 ---