# Benchmark

This document describes SQLRec's performance testing method and results.

## Test Environment

**Hardware Configuration**:
- CPU: AMD Ryzen 5 5600H
- Memory: 32GB DDR4

**Software Environment**:
- Operating System: Debian 12
- Kubernetes: Minikube
- SQLRec: single-instance deployment

## Test Data

The default test configuration is as follows:

| Configuration Item | Value |
|-------------------|-------|
| Number of Users | 100,000 |
| Number of Items | 100,000 |
| Vector Dimension | 8 |
| User Embedding | Fixed value |

## Recommendation Pipeline

The tested recommendation pipeline includes the following stages:

### Recall Stage

| Recall Strategy | Description | Recall Count |
|----------------|-------------|--------------|
| Global Hot Recall | Ranks items by global popularity | 300 |
| User Interest Category Recall | Recalls hot items from the user's interest categories | 300 |
| ItemCF Recall | Item-based collaborative filtering | 300 |
| Vector Search Recall | Vector similarity search | 300 |

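Conceptually, the four recall sources are merged into a single candidate list before filtering. A minimal sketch of that merge step is below; the function and variable names are hypothetical illustrations, not SQLRec's actual API:

```python
# Illustrative recall-merge step: take up to 300 items from each recall
# source and deduplicate by item id, keeping the first occurrence.
# Names here are hypothetical, not SQLRec's actual implementation.

def merge_recalls(*sources, limit_per_source=300):
    seen = set()
    merged = []
    for source in sources:
        for item_id in source[:limit_per_source]:
            if item_id not in seen:
                seen.add(item_id)
                merged.append(item_id)
    return merged

# Toy example with overlapping recall results.
global_hot = [1, 2, 3]
category_hot = [2, 3, 4]
itemcf = [3, 4, 5]
vector_search = [5, 6]
candidates = merge_recalls(global_hot, category_hot, itemcf, vector_search)
print(candidates)  # [1, 2, 3, 4, 5, 6]
```

With four sources of 300 items each, the merged candidate set is at most 1,200 items, fewer when the sources overlap.
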
### Filtering Stage

| Filtering Strategy | Description |
|-------------------|-------------|
| Exposure Deduplication | Filters out items already exposed to the user |
| Category Diversification | Shows at most N items per category |

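The two filtering strategies can be sketched as a single pass over the candidate list; this is an illustrative reimplementation, not SQLRec's actual code, and the cap of 2 items per category is an assumed value for N:

```python
# Illustrative filtering stage: exposure deduplication followed by
# category diversification. Not SQLRec's actual implementation.
from collections import defaultdict

def filter_candidates(items, exposed_ids, max_per_category=2):
    """items: list of (item_id, category) pairs in ranked order."""
    per_category = defaultdict(int)
    result = []
    for item_id, category in items:
        if item_id in exposed_ids:
            continue  # exposure deduplication
        if per_category[category] >= max_per_category:
            continue  # category diversification: at most N per category
        per_category[category] += 1
        result.append(item_id)
    return result

items = [(1, "news"), (2, "news"), (3, "news"), (4, "sports"), (5, "sports")]
print(filter_candidates(items, exposed_ids={4}))  # [1, 2, 5]
```

Item 3 is dropped by the category cap and item 4 by exposure deduplication, so the ranked order of the survivors is preserved.
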
## Test Scripts

### Initialize Test Environment

```bash
cd benchmark
bash init.sh
```

The `init.sh` script performs the following operations:

1. **Create the Milvus Vector Collection**
   - Create the `item_embedding` collection
   - Define the vector dimension as 8
   - Create a COSINE similarity index

2. **Create Data Tables**
   - User table (`user_table`)
   - Item table (`item_table`)
   - Global hot items table (`global_hot_item`)
   - User interest category table (`user_interest_category1`)
   - Category hot items table (`category1_hot_item`)
   - User recent clicks table (`user_recent_click_item`)
   - User exposure table (`user_exposure_item`)
   - ItemCF I2I table (`itemcf_i2i`)
   - Item vector table (`item_embedding`)
   - Recommendation log table (`rec_log_kafka`)

3. **Generate Simulated Data**
   - Use Python scripts to generate data for 100,000 users and 100,000 items
   - Generate user behavior data and upload it to HDFS

4. **Install Test Tools**
   - Install the wrk HTTP benchmarking tool

| 83 | + |
| 84 | +```bash |
| 85 | +bash benchmark.sh |
| 86 | +``` |
| 87 | + |
| 88 | +The `benchmark.sh` script performs the following operations: |
| 89 | + |
| 90 | +1. **Warm-up Phase** |
| 91 | + - Single thread, single connection, run for 10 seconds |
| 92 | + - Warm up system cache |
| 93 | + |
| 94 | +2. **Formal Testing** |
| 95 | + - Concurrency: 10 |
| 96 | + - Duration: 30 seconds |
| 97 | + - Test URL: `/api/v1/main_rec` |
| 98 | + |
| 99 | +### Test Request Script |
| 100 | + |
| 101 | +`request.lua` is a custom request script for wrk: |
| 102 | + |
| 103 | +```lua |
| 104 | +-- Set random seed |
| 105 | +math.randomseed(os.time()) |
| 106 | + |
| 107 | +function request() |
| 108 | + -- Generate random ID between 0-99999 |
| 109 | + local random_id = math.random(0, 99999) |
| 110 | + |
| 111 | + -- Construct request body |
| 112 | + local request_body = string.format( |
| 113 | + '{"inputs":{"user_info":[{"id":%d}]},"params":{"recall_fun":"recall_fun"}}', |
| 114 | + random_id |
| 115 | + ) |
| 116 | + |
| 117 | + -- Configure HTTP request |
| 118 | + wrk.method = "POST" |
| 119 | + wrk.headers["Content-Type"] = "application/json" |
| 120 | + wrk.body = request_body |
| 121 | + |
| 122 | + return wrk.format() |
| 123 | +end |
| 124 | +``` |
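
The request body built by the Lua script can be reproduced and sanity-checked in Python; the field names and endpoint semantics come straight from the script above:

```python
# Build the same JSON body that request.lua sends and verify it parses.
import json
import random

def build_body(user_id):
    return json.dumps({
        "inputs": {"user_info": [{"id": user_id}]},
        "params": {"recall_fun": "recall_fun"},
    }, separators=(",", ":"))

body = build_body(random.randint(0, 99999))
parsed = json.loads(body)
assert 0 <= parsed["inputs"]["user_info"][0]["id"] <= 99999
```
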

## Test Results

Test results on the AMD Ryzen 5 5600H, 32GB DDR4 machine:

```
Running 30s test @ http://192.168.49.2:30301/api/v1/main_rec
  10 threads and 10 connections
  Thread Stats   Avg      Stdev     Max   +/- Stdev
    Latency    10.80ms    4.81ms   53.85ms   92.68%
    Req/Sec    95.12     17.61    121.00     82.63%
  28464 requests in 30.02s, 49.80MB read
  Socket errors: connect 0, read 28463, write 0, timeout 0
Requests/sec:    948.09
Transfer/sec:      1.66MB
```

**Performance Metrics**:

| Metric | Value |
|--------|-------|
| Average Latency | 10.80ms |
| Latency Standard Deviation | 4.81ms |
| Max Latency | 53.85ms |
| Average Req/Sec per Thread | 95.12 |
| Total Requests | 28,464 |
| Overall QPS | 948.09 |
| Throughput | 1.66MB/s |
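
The aggregate figures are internally consistent, which a quick check confirms (wrk's own accounting rounds slightly differently, hence the small tolerances):

```python
# Cross-check the wrk summary: total requests / duration ≈ reported QPS,
# and total bytes read / duration ≈ reported throughput.
requests, duration_s = 28464, 30.02
read_mb = 49.80

qps = requests / duration_s        # ≈ 948.17 vs reported 948.09
mb_per_s = read_mb / duration_s    # ≈ 1.659 vs reported 1.66

assert abs(qps - 948.09) < 1.0
assert abs(mb_per_s - 1.66) < 0.01
print(round(qps, 2), round(mb_per_s, 2))  # 948.17 1.66
```
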