doc: refine the software architecture diagram in the top-level README.md

zhouwg · web-flow · commit c554c74c2640 · 2025-03-08T13:02:56.000+08:00
diff --git a/README.md b/README.md
@@ -246,21 +246,21 @@ Instructions for adding support for new models: [HOWTO-add-model.md](docs/develo
 | [OpenCL](docs/backend/OPENCL.md) | Adreno GPU |
 
 ## Software architecture
-
 ```mermaid
 block-beta
 columns 1
 
 block:llamacpp
-   llamacpp["llama_cpp"]
-   style llamacpp fill:#3c3,color:#000,stroke:#000
+  llamacpp["llama_cpp"]
+  style llamacpp fill:#3c3,color:#000,stroke:#000
 end
 
-block:ggml
-   ggml["GGML"]
-   style ggml     fill:#3c3,color:#000,stroke:#000
+block:ggml_backend
+  ggml_backend["GGML backend subsystem"]
+  style ggml_backend fill:#3c3,color:#000,stroke:#000
 
-   ggml_cpu["ggml-cpu"]
+block:ggmlbackends
+   ggml_cpu["ggml-cpu"]
    ggml_metal["ggml-metal"]
    ggml_sycl["ggml-sycl"]
    ggml_cuda["ggml-cuda"]
@@ -272,25 +272,43 @@ block:ggml
    ggml_nnpa["ggml-nnpa"]
    ggml_ane["ggml-ane"]
 
-   style ggml_cpu       fill:#888,color:#000,stroke:#000
-   style ggml_metal     fill:#888,color:#000,stroke:#000
-   style ggml_sycl      fill:#888,color:#000,stroke:#000
-   style ggml_cuda      fill:#888,color:#000,stroke:#000
-   style ggml_hip       fill:#888,color:#000,stroke:#000
-   style ggml_vulkan    fill:#888,color:#000,stroke:#000
-   style ggml_cann      fill:#888,color:#000,stroke:#000
+   style ggml_cpu  fill:#888,color:#000,stroke:#000
+   style ggml_metal  fill:#888,color:#000,stroke:#000
+   style ggml_sycl  fill:#888,color:#000,stroke:#000
+   style ggml_cuda fill:#888,color:#000,stroke:#000
+   style ggml_hip fill:#888,color:#000,stroke:#000
+   style ggml_vulkan  fill:#888,color:#000,stroke:#000
+   style ggml_cann  fill:#888,color:#000,stroke:#000
 
    style ggml_opencl    fill:#cc3,color:#000,stroke:#000
    style ggml_qnn       fill:#cc3,color:#000,stroke:#000
    style ggml_ane       fill:#fff,color:#000,stroke:#f00,stroke-width:2,stroke-dasharray:5
    style ggml_nnpa      fill:#cc3,color:#000,stroke:#000
+  end
 end
 
 block:ggml_pal
-   ggml_pal["GGML Platform Abstraction Layer"]
-   style ggml_pal       fill:#c33,color:#000,stroke:#000
+  ggml_pal["Platform Abstraction Layer"]
+  style ggml_pal fill:#c33,color:#000,stroke:#000
 end
 
+block:ggml_backendsubsystem
+  ggml_backendsubsystem["GGML backend subsystem"]
+  style ggml_backendsubsystem fill:#3c3,color:#000,stroke:#000
+end
+
+block:group1:2
+  columns 2
+  block:ggml_tensor
+  ggml_tensor["GGML tensor"]
+  style ggml_tensor fill:#3c3,color:#000,stroke:#000
+  end
+
+  block:ggml_cgraph
+  ggml_cgraph["GGML cgraph"]
+  style ggml_cgraph  fill:#3c3,color:#000,stroke:#000
+  end
+end
 
 block:OS
     Windows
@@ -345,11 +363,12 @@ flowchart LR
     classDef TODO fill:#c33,color:#000,stroke:#000
     classDef NEW fill:#fff,color:#000,stroke:#f00,stroke-width:2,stroke-dasharray:5
     subgraph Legend
       direction LR
       EXIST:::EXIST ~~~ TODO:::TODO ~~~ WIP:::WIP ~~~ DONE:::DONE ~~~ NEW:::NEW
     end
 ```
 
+
 ## Building the project
 
 The main product of this project is the `llama` library. Its C-style interface can be found in [include/llama.h](include/llama.h).