From 563a7bdb18b5d766bbbf904208db4a2e74f88305 Mon Sep 17 00:00:00 2001
From: HydrogenSulfate <490868991@qq.com>
Date: Sat, 21 Dec 2024 20:21:29 +0800
Subject: [PATCH 1/8] update paddle icon and document related to paddle
---
README.md | 2 +-
doc/_static/paddle.svg | 10 ++++
doc/backend.md | 13 +++-
doc/conf.py | 1 +
doc/env.md | 15 +++++
doc/freeze/freeze.md | 23 +++++++
doc/install/easy-install.md | 34 +++++++++++
doc/install/install-from-source.md | 77 +++++++++++++++++++++++-
doc/model/dpa2.md | 4 +-
doc/model/sel.md | 8 +++
doc/model/train-energy.md | 4 +-
doc/model/train-se-atten.md | 4 +-
doc/model/train-se-e2-a.md | 4 +-
doc/train/finetuning.md | 70 +++++++++++++++++++++-
doc/train/parallel-training.md | 96 +++++++++++++++++++++++++++++-
doc/train/tensorboard.md | 4 +-
doc/train/training.md | 8 +++
17 files changed, 358 insertions(+), 19 deletions(-)
create mode 100644 doc/_static/paddle.svg
diff --git a/README.md b/README.md
index 18bdfd6560..e374039144 100644
--- a/README.md
+++ b/README.md
@@ -19,7 +19,7 @@ For more information, check the [documentation](https://deepmd.readthedocs.io/).
### Highlighted features
-- **interfaced with multiple backends**, including TensorFlow, PyTorch, and JAX, the most popular deep learning frameworks, making the training process highly automatic and efficient.
+- **interfaced with multiple backends**, including TensorFlow, PyTorch, JAX and Paddle, the most popular deep learning frameworks, making the training process highly automatic and efficient.
- **interfaced with high-performance classical MD and quantum (path-integral) MD packages**, including LAMMPS, i-PI, AMBER, CP2K, GROMACS, OpenMM, and ABACUS.
- **implements the Deep Potential series models**, which have been successfully applied to finite and extended systems, including organic molecules, metals, semiconductors, insulators, etc.
- **implements MPI and GPU supports**, making it highly efficient for high-performance parallel and distributed computing.
diff --git a/doc/_static/paddle.svg b/doc/_static/paddle.svg
new file mode 100644
index 0000000000..5fdd09df04
--- /dev/null
+++ b/doc/_static/paddle.svg
@@ -0,0 +1,10 @@
+
+
diff --git a/doc/backend.md b/doc/backend.md
index 2be7ab7460..8062b623ca 100644
--- a/doc/backend.md
+++ b/doc/backend.md
@@ -5,7 +5,7 @@
DeePMD-kit supports multiple backends: TensorFlow and PyTorch.
To use DeePMD-kit, you must install at least one backend.
Each backend does not support all features.
-In the documentation, TensorFlow {{ tensorflow_icon }} and PyTorch {{ pytorch_icon }} icons are used to mark whether a backend supports a feature.
+In the documentation, TensorFlow {{ tensorflow_icon }}, PyTorch {{ pytorch_icon }}, and Paddle {{ paddle_icon }} icons are used to mark whether a backend supports a feature.
### TensorFlow {{ tensorflow_icon }}
@@ -35,6 +35,15 @@ Only the `.savedmodel` format supports C++ inference, which needs the TensorFlow
The model is device-specific, so that the model generated on the GPU device cannot be run on the CPUs.
Currently, this backend is developed actively, and has no support for training.
+### Paddle {{ paddle_icon }}
+
+- Model filename extensions: `.json` and `.pdiparams`
+- Checkpoint filename extension: `.pd`
+
+[Paddle](https://www.paddlepaddle.org.cn/) version 3.0 or above is required.
+
+The `.pd` extension is used for model checkpoints during training and testing in Python. The `.json` file stores the model's computational graph in [PIR representation](https://www.paddlepaddle.org.cn/documentation/docs/zh/develop/guides/paddle_v3_features/paddle_ir_cn.html), while the `.pdiparams` file stores the model parameters. The `.json` and `.pdiparams` files are exported together during model freezing and are used for C++ inference.
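+
+For example, training with the Paddle backend writes `.pd` checkpoints, while freezing exports the paired `.json` and `.pdiparams` files (the commands below are documented in the training and freezing sections):
+
+```bash
+# train with the Paddle backend; checkpoints are saved with the .pd extension
+dp --pd train input.json
+# freeze the trained model: writes model.json and model.pdiparams
+dp --pd freeze -o model
+```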
+
### DP {{ dpmodel_icon }}
:::{note}
@@ -57,7 +66,7 @@ NumPy 1.21 or above is required.
### Training
-When training and freezing a model, you can use `dp --tf` or `dp --pt` in the command line to switch the backend.
+When training and freezing a model, you can use `dp --tf`, `dp --pt`, or `dp --pd` in the command line to switch the backend.
### Inference
diff --git a/doc/conf.py b/doc/conf.py
index b266126c58..52c647a20d 100644
--- a/doc/conf.py
+++ b/doc/conf.py
@@ -167,6 +167,7 @@
"tensorflow_icon": """![TensorFlow](/_static/tensorflow.svg){class=platform-icon}""",
"pytorch_icon": """![PyTorch](/_static/pytorch.svg){class=platform-icon}""",
"jax_icon": """![JAX](/_static/jax.svg){class=platform-icon}""",
+ "paddle_icon": """![Paddle](/_static/paddle.svg){class=platform-icon}""",
"dpmodel_icon": """![DP](/_static/logo_icon.svg){class=platform-icon}""",
}
diff --git a/doc/env.md b/doc/env.md
index 3cf42b724a..5ff4cc695c 100644
--- a/doc/env.md
+++ b/doc/env.md
@@ -56,6 +56,21 @@ Control high (double) or low (float) precision of training.
{{ tensorflow_icon }} Enable JIT. Note that this option may either improve or decrease the performance. Requires TensorFlow to support JIT.
:::
+:::{envvar} PD_JIT
+
+**Choices**: `0`, `1`; **Default**: `0`
+
+{{ paddle_icon }} Enable Paddle JIT. Note that this option may either improve or decrease the performance.
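+
+A minimal usage sketch:
+
+```bash
+PD_JIT=1 dp --pd train input.json
+```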
+:::
+
+:::{envvar} PD_CINN
+
+**Choices**: `0`, `1`; **Default**: `0`
+
+{{ paddle_icon }} Enable the Paddle CINN compiler when `PD_JIT` is enabled. Note that this option may either improve or decrease the performance. Requires a Paddle build with CINN support (`paddle.device.is_compiled_with_cinn()` returns `True`).
+
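+For example (a usage sketch), check whether your Paddle build supports CINN and enable it together with `PD_JIT`:
+
+```bash
+# check whether this Paddle build was compiled with CINN
+python -c "import paddle; print(paddle.device.is_compiled_with_cinn())"
+# enable JIT and the CINN compiler for a training run
+PD_JIT=1 PD_CINN=1 dp --pd train input.json
+```
+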
+:::
+
:::{envvar} DP_INFER_BATCH_SIZE
**Default**: `1024` on CPUs and as maximum as possible until out-of-memory on GPUs
diff --git a/doc/freeze/freeze.md b/doc/freeze/freeze.md
index f394b64283..20f02177c6 100644
--- a/doc/freeze/freeze.md
+++ b/doc/freeze/freeze.md
@@ -32,3 +32,26 @@ $ dp --pt freeze -o model_branch1.pth --head CHOSEN_BRANCH
```
The output model is called `model_branch1.pth`, which is the specifically frozen model with the `CHOSEN_BRANCH` head.
+
+:::
+
+:::{tab-item} Paddle {{ paddle_icon }}
+
+```bash
+$ dp --pd freeze -o model
+```
+
+in the folder where the model is trained. The output model consists of `model.json` and `model.pdiparams`.
+
+In [multi-task mode](../train/multi-task-training-pd.md), you need to choose one of the available heads (e.g. `CHOSEN_BRANCH`) via `--head`
+to specify which model branch you want to freeze:
+
+```bash
+$ dp --pd freeze -o model_branch1 --head CHOSEN_BRANCH
+```
+
+The output model files are `model_branch1.json` and `model_branch1.pdiparams`, which form the specifically frozen model with the `CHOSEN_BRANCH` head.
+
+:::
+
+::::
diff --git a/doc/install/easy-install.md b/doc/install/easy-install.md
index b892463caf..0bf8f98967 100644
--- a/doc/install/easy-install.md
+++ b/doc/install/easy-install.md
@@ -186,6 +186,40 @@ Switch to the TensorFlow {{ tensorflow_icon }} tab for more information.
::::::
+::::::{tab-item} Paddle {{ paddle_icon }}
+
+:::::{tab-set}
+
+::::{tab-item} CUDA 12.3
+
+```bash
+pip install deepmd-kit[paddle]
+```
+
+::::
+
+::::{tab-item} CUDA 11.8
+
+```bash
+pip install paddlepaddle-gpu==3.0.0b2 -i https://www.paddlepaddle.org.cn/packages/stable/cu118/
+pip install deepmd-kit-cu11
+```
+
+::::
+
+::::{tab-item} CPU
+
+```bash
+pip install paddlepaddle==3.0.0b2 -i https://www.paddlepaddle.org.cn/packages/stable/cpu/
+pip install deepmd-kit
+```
+
+::::
+
+:::::
+
+::::::
+
:::::::
The supported platform includes Linux x86-64 and aarch64 with GNU C Library 2.28 or above, macOS x86-64 and arm64, and Windows x86-64.
diff --git a/doc/install/install-from-source.md b/doc/install/install-from-source.md
index 63060f692a..5643f6270a 100644
--- a/doc/install/install-from-source.md
+++ b/doc/install/install-from-source.md
@@ -93,6 +93,21 @@ One can also [use conda](https://docs.deepmodeling.org/faq/conda.html) to instal
:::
+:::{tab-item} Paddle {{ paddle_icon }}
+
+To install Paddle, run
+
+```sh
+# cu123
+pip install --pre paddlepaddle-gpu -i https://www.paddlepaddle.org.cn/packages/nightly/cu123/
+# cu118
+pip install --pre paddlepaddle-gpu -i https://www.paddlepaddle.org.cn/packages/nightly/cu118/
+# cpu
+pip install --pre paddlepaddle -i https://www.paddlepaddle.org.cn/packages/nightly/cpu/
+```
+
+:::
+
::::
It is important that every time a new shell is started and one wants to use `DeePMD-kit`, the virtual environment should be activated by
@@ -119,7 +134,7 @@ One should remember to activate the virtual environment every time he/she uses D
Check the compiler version on your machine
-```
+```bash
gcc --version
```
@@ -141,6 +156,12 @@ Note that PyTorch may have specific requirements for the compiler version to sup
:::
+:::{tab-item} Paddle {{ paddle_icon }}
+
+You can set the environment variable `DP_ENABLE_PADDLE=1` to enable customized C++ OPs in the Paddle backend.
+
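+A minimal sketch of a source build with Paddle C++ OPs enabled (assuming the Paddle inference library has been downloaded to the given path; the final `pip install .` step follows the generic install instructions below):
+
+```bash
+# enable customized C++ OPs for the Paddle backend
+export DP_ENABLE_PADDLE=1
+# required when DP_ENABLE_PADDLE is enabled; see PADDLE_INFERENCE_DIR below
+export PADDLE_INFERENCE_DIR=/path/to/paddle_inference_install_dir
+pip install .
+```
+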
+:::
+
::::
Execute
@@ -188,6 +209,13 @@ The path to the ROCM toolkit directory. If `ROCM_ROOT` is not set, it will look
{{ pytorch_icon }} Enable customized C++ OPs for the PyTorch backend. PyTorch can still run without customized C++ OPs, but features will be limited.
:::
+:::{envvar} DP_ENABLE_PADDLE
+
+**Choices**: `0`, `1`; **Default**: `0`
+
+{{ paddle_icon }} Enable customized C++ OPs for the Paddle backend. Paddle can still run without customized C++ OPs, but features will be limited.
+:::
+
:::{envvar} TENSORFLOW_ROOT
**Type**: Path; **Default**: Detected automatically
@@ -202,6 +230,13 @@ The path to the ROCM toolkit directory. If `ROCM_ROOT` is not set, it will look
{{ pytorch_icon }} The path to PyTorch Python library. If not given, by default, the installer only finds PyTorch under the user site-package directory (`site.getusersitepackages()`) or the system site-package directory (`sysconfig.get_path("purelib")`) due to the limitation of [PEP-517](https://peps.python.org/pep-0517/). If not found, the latest PyTorch (or the environment variable `PYTORCH_VERSION` if given) from PyPI will be built against.
:::
+:::{envvar} PADDLE_INFERENCE_DIR
+
+**Type**: Path; **Default**: None
+
+{{ paddle_icon }} The path to the Paddle inference library, e.g. `/path/to/paddle_inference_install_dir`. When `DP_ENABLE_PADDLE` is enabled, this variable must be set manually; otherwise, installation will fail.
+:::
+
:::{envvar} DP_ENABLE_NATIVE_OPTIMIZATION
**Choices**: `0`, `1`; **Default**: `0`
@@ -229,7 +264,7 @@ Other [CMake environment variables](https://cmake.org/cmake/help/latest/manual/c
To test the installation, one should first jump out of the source directory
-```
+```bash
cd /some/other/workspace
```
@@ -325,6 +360,18 @@ download the TensorFlow C library from [this page](https://www.tensorflow.org/in
:::
+:::{tab-item} Paddle {{ paddle_icon }}
+
+If you want to use the C++ interface of Paddle, you need to compile the Paddle inference library (C++ interface) manually following the [linux-compile-by-make](https://www.paddlepaddle.org.cn/documentation/docs/zh/develop/install/compile/linux-compile-by-make.html) guide, and then use the `.so` and `.a` files in `Paddle/build/paddle_inference_install_dir/`.
+
+We also provide nightly pre-compiled Paddle C++ libraries for Linux x86_64 with CUDA 11.8 and 12.3:
+
+[Cuda118_cudnn860_Trt8531_D1/latest/paddle_inference.tgz](https://paddle-qa.bj.bcebos.com/paddle-pipeline/GITHUB_Docker_Compile_Test_Cuda118_cudnn860_Trt8531_D1/latest/paddle_inference.tgz)
+
+[Cuda123_cudnn900_Trt8616_D1/latest/paddle_inference.tgz](https://paddle-qa.bj.bcebos.com/paddle-pipeline/GITHUB_Docker_Compile_Test_Cuda123_cudnn900_Trt8616_D1/latest/paddle_inference.tgz)
+
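+For example (a sketch; the name of the directory extracted from the archive is an assumption and should be adjusted to the actual layout):
+
+```bash
+# download and unpack the pre-compiled CUDA 12.3 inference library
+wget https://paddle-qa.bj.bcebos.com/paddle-pipeline/GITHUB_Docker_Compile_Test_Cuda123_cudnn900_Trt8616_D1/latest/paddle_inference.tgz
+tar -xzf paddle_inference.tgz
+# point the build to the extracted directory (name assumed)
+export PADDLE_INFERENCE_DIR=$PWD/paddle_inference_install_dir
+```
+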
+:::
+
::::
### Install DeePMD-kit's C++ interface
@@ -389,6 +436,16 @@ cmake -DENABLE_JAX=ON -D CMAKE_PREFIX_PATH=${tensorflow_c_root} ..
:::
+:::{tab-item} Paddle {{ paddle_icon }}
+
+Assuming you have downloaded the Paddle inference library (C++ interface) to `$PADDLE_INFERENCE_DIR`, execute CMake:
+
+```bash
+cmake -DENABLE_PADDLE=ON -DPADDLE_INFERENCE_DIR=$PADDLE_INFERENCE_DIR -DCMAKE_INSTALL_PREFIX=$deepmd_root ..
+```
+
+:::
+
::::
One may add the following CMake variables to `cmake` using the [`-D =` option](https://cmake.org/cmake/help/latest/manual/cmake.1.html#cmdoption-cmake-D):
@@ -420,6 +477,14 @@ If {cmake:variable}`ENABLE_TENSORFLOW` is `OFF`, the TensorFlow C library is use
:::
+:::{cmake:variable} ENABLE_PADDLE
+
+**Type**: `BOOL` (`ON`/`OFF`), Default: `OFF`
+
+{{ paddle_icon }} Whether building the Paddle backend.
+
+:::
+
:::{cmake:variable} TENSORFLOW_ROOT
**Type**: `PATH`
@@ -428,6 +493,14 @@ If {cmake:variable}`ENABLE_TENSORFLOW` is `OFF`, the TensorFlow C library is use
:::
+:::{cmake:variable} PADDLE_INFERENCE_DIR
+
+**Type**: `PATH`
+
+{{ paddle_icon }} The path to Paddle's C++ inference directory, such as `/path/to/paddle_inference_install_dir` or `/path/to/paddle_inference`.
+
+:::
+
:::{cmake:variable} CMAKE_INSTALL_PREFIX
**Type**: `PATH`
diff --git a/doc/model/dpa2.md b/doc/model/dpa2.md
index eb641d6b01..70c9fee9d5 100644
--- a/doc/model/dpa2.md
+++ b/doc/model/dpa2.md
@@ -1,7 +1,7 @@
-# Descriptor DPA-2 {{ pytorch_icon }} {{ jax_icon }} {{ dpmodel_icon }}
+# Descriptor DPA-2 {{ pytorch_icon }} {{ jax_icon }} {{ paddle_icon }} {{ dpmodel_icon }}
:::{note}
-**Supported backends**: PyTorch {{ pytorch_icon }}, JAX {{ jax_icon }}, DP {{ dpmodel_icon }}
+**Supported backends**: PyTorch {{ pytorch_icon }}, JAX {{ jax_icon }}, Paddle {{ paddle_icon }}, DP {{ dpmodel_icon }}
:::
The DPA-2 model implementation. See https://arxiv.org/abs/2312.15492 for more details.
diff --git a/doc/model/sel.md b/doc/model/sel.md
index babea1d463..5b85318dd9 100644
--- a/doc/model/sel.md
+++ b/doc/model/sel.md
@@ -32,6 +32,14 @@ dp --jax neighbor-stat -s data -r 6.0 -t O H
:::
+:::{tab-item} Paddle {{ paddle_icon }}
+
+```sh
+dp --pd neighbor-stat -s data -r 6.0 -t O H
+```
+
+:::
+
::::
where `data` is the directory of data, `6.0` is the cutoff radius, and `O` and `H` is the type map. The program will give the `max_nbor_size`. For example, `max_nbor_size` of the water example is `[38, 72]`, meaning an atom may have 38 O neighbors and 72 H neighbors in the training data.
diff --git a/doc/model/train-energy.md b/doc/model/train-energy.md
index 484564b14f..128779ee16 100644
--- a/doc/model/train-energy.md
+++ b/doc/model/train-energy.md
@@ -1,7 +1,7 @@
-# Fit energy {{ tensorflow_icon }} {{ pytorch_icon }} {{ jax_icon }} {{ dpmodel_icon }}
+# Fit energy {{ tensorflow_icon }} {{ pytorch_icon }} {{ jax_icon }} {{ paddle_icon }} {{ dpmodel_icon }}
:::{note}
-**Supported backends**: TensorFlow {{ tensorflow_icon }}, PyTorch {{ pytorch_icon }}, JAX {{ jax_icon }}, DP {{ dpmodel_icon }}
+**Supported backends**: TensorFlow {{ tensorflow_icon }}, PyTorch {{ pytorch_icon }}, JAX {{ jax_icon }}, Paddle {{ paddle_icon }}, DP {{ dpmodel_icon }}
:::
In this section, we will take `$deepmd_source_dir/examples/water/se_e2_a/input.json` as an example of the input file.
diff --git a/doc/model/train-se-atten.md b/doc/model/train-se-atten.md
index 92a56395f6..5b9e4d7e4a 100644
--- a/doc/model/train-se-atten.md
+++ b/doc/model/train-se-atten.md
@@ -1,7 +1,7 @@
-# Descriptor `"se_atten"` {{ tensorflow_icon }} {{ pytorch_icon }} {{ jax_icon }} {{ dpmodel_icon }}
+# Descriptor `"se_atten"` {{ tensorflow_icon }} {{ pytorch_icon }} {{ jax_icon }} {{ paddle_icon }} {{ dpmodel_icon }}
:::{note}
-**Supported backends**: TensorFlow {{ tensorflow_icon }}, PyTorch {{ pytorch_icon }}, JAX {{ jax_icon }}, DP {{ dpmodel_icon }}
+**Supported backends**: TensorFlow {{ tensorflow_icon }}, PyTorch {{ pytorch_icon }}, JAX {{ jax_icon }}, Paddle {{ paddle_icon }}, DP {{ dpmodel_icon }}
:::
![ALT](../images/model_se_atten.png "model_se_atten")
diff --git a/doc/model/train-se-e2-a.md b/doc/model/train-se-e2-a.md
index 5143d5b5fb..9382c78d8e 100644
--- a/doc/model/train-se-e2-a.md
+++ b/doc/model/train-se-e2-a.md
@@ -1,7 +1,7 @@
-# Descriptor `"se_e2_a"` {{ tensorflow_icon }} {{ pytorch_icon }} {{ jax_icon }} {{ dpmodel_icon }}
+# Descriptor `"se_e2_a"` {{ tensorflow_icon }} {{ pytorch_icon }} {{ jax_icon }} {{ paddle_icon }} {{ dpmodel_icon }}
:::{note}
-**Supported backends**: TensorFlow {{ tensorflow_icon }}, PyTorch {{ pytorch_icon }}, JAX {{ jax_icon }}, DP {{ dpmodel_icon }}
+**Supported backends**: TensorFlow {{ tensorflow_icon }}, PyTorch {{ pytorch_icon }}, JAX {{ jax_icon }}, Paddle {{ paddle_icon }}, DP {{ dpmodel_icon }}
:::
The notation of `se_e2_a` is short for the Deep Potential Smooth Edition (DeepPot-SE) constructed from all information (both angular and radial) of atomic configurations. The `e2` stands for the embedding with two-atoms information. This descriptor was described in detail in [the DeepPot-SE paper](https://arxiv.org/abs/1805.09003).
diff --git a/doc/train/finetuning.md b/doc/train/finetuning.md
index cf2f5fde4f..d7175121d6 100644
--- a/doc/train/finetuning.md
+++ b/doc/train/finetuning.md
@@ -1,7 +1,7 @@
-# Finetune the pre-trained model {{ tensorflow_icon }} {{ pytorch_icon }}
+# Finetune the pre-trained model {{ tensorflow_icon }} {{ pytorch_icon }} {{ paddle_icon }}
:::{note}
-**Supported backends**: TensorFlow {{ tensorflow_icon }}, PyTorch {{ pytorch_icon }}
+**Supported backends**: TensorFlow {{ tensorflow_icon }}, PyTorch {{ pytorch_icon }}, Paddle {{ paddle_icon }}
:::
Pretraining-and-finetuning is a widely used approach in other fields such as Computer Vision (CV) or Natural Language Processing (NLP)
@@ -196,3 +196,69 @@ This will initiate multitask fine-tuning, where for branches `PRE_DATA1` and `PR
it is akin to continuing training in `init-model` mode, whereas for `DOWNSTREAM_DATA`,
fine-tuning will be based on the fitting net from `PRE_DATA1`.
You can set `model_prob` for each dataset just the same as that in normal multitask training.
+
+## Paddle Implementation {{ paddle_icon }}
+
+In the Paddle version, we have introduced an updated, more adaptable approach to fine-tuning. This methodology encompasses two primary variations:
+
+### Single-task fine-tuning
+
+#### Fine-tuning from a single-task pre-trained model
+
+By saying "single-task pre-trained", we refer to a model pre-trained on a single dataset.
+This fine-tuning method is similar to the fine-tune approach supported by TensorFlow.
+It utilizes a single-task pre-trained model (`pretrained.pd`) and modifies the energy bias within its fitting net before continuing with training.
+The command for this operation is:
+
+```bash
+$ dp --pd train input.json --finetune pretrained.pd
+```
+
+In this case, it is important to note that the fitting net weights, except the energy bias, will be automatically set to those in the pre-trained model. This default setting is consistent with the TensorFlow implementation.
+If you wish to conduct fine-tuning using a randomly initialized fitting net in this scenario, you can set the `--model-branch` parameter to `RANDOM`:
+
+```bash
+$ dp --pd train input.json --finetune pretrained.pd --model-branch RANDOM
+```
+
+The model section in `input.json` **must be the same as that in the pre-trained model**.
+If you do not know the model parameters in the pre-trained model, you can add `--use-pretrain-script` to the fine-tuning command:
+
+```bash
+$ dp --pd train input.json --finetune pretrained.pd --use-pretrain-script
+```
+
+The model section will be overwritten (except the `type_map` subsection) by that in the pre-trained model, and then `input.json` can be simplified as follows:
+
+```json
+ "model": {
+ "type_map": ["O", "H"],
+ "descriptor" : {},
+ "fitting_net" : {}
+ }
+```
+
+#### Fine-tuning from a multi-task pre-trained model
+
+Additionally, within the Paddle implementation, leveraging the flexibility offered by the framework and the multi-task training process proposed in the DPA-2 [paper](https://arxiv.org/abs/2312.15492),
+we also support more general multi-task pre-trained models, which include multiple datasets for pre-training. These pre-training datasets share a common descriptor while maintaining their individual fitting nets,
+as detailed in the paper above.
+
+For fine-tuning using this multi-task pre-trained model (`multitask_pretrained.pd`),
+one can select a specific branch (e.g., `CHOSEN_BRANCH`) included in `multitask_pretrained.pd` for fine-tuning with the following command:
+
+```bash
+$ dp --pd train input.json --finetune multitask_pretrained.pd --model-branch CHOSEN_BRANCH
+```
+
+:::{note}
+One can check the available model branches in a multi-task pre-trained model by referring to the documentation of the pre-trained model or by using the following command:
+
+```bash
+$ dp --pd show multitask_pretrained.pd model-branch
+```
+
+:::
+
+This command will start fine-tuning based on the pre-trained model's descriptor and the selected branch's fitting net.
+If `--model-branch` is not set or is set to `RANDOM`, a randomly initialized fitting net will be used.
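+
+For example (a usage sketch), fine-tuning with a randomly initialized fitting net:
+
+```bash
+$ dp --pd train input.json --finetune multitask_pretrained.pd --model-branch RANDOM
+```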
diff --git a/doc/train/parallel-training.md b/doc/train/parallel-training.md
index 9ea92b4751..4a94ee5e26 100644
--- a/doc/train/parallel-training.md
+++ b/doc/train/parallel-training.md
@@ -1,7 +1,7 @@
-# Parallel training {{ tensorflow_icon }} {{ pytorch_icon }}
+# Parallel training {{ tensorflow_icon }} {{ pytorch_icon }} {{ paddle_icon }}
:::{note}
-**Supported backends**: TensorFlow {{ tensorflow_icon }}, PyTorch {{ pytorch_icon }}
+**Supported backends**: TensorFlow {{ tensorflow_icon }}, PyTorch {{ pytorch_icon }}, Paddle {{ paddle_icon }}
:::
## TensorFlow Implementation {{ tensorflow_icon }}
@@ -187,3 +187,95 @@ torchrun --rdzv_endpoint=node0:12321 --nnodes=2 --nproc_per_node=4 --node_rank=1
> **Note** for developers: `torchrun` by default passes settings as environment variables [(list here)](https://pytorch.org/docs/stable/elastic/run.html#environment-variables).
> To check forward, backward, and communication time, please set env var `TORCH_CPP_LOG_LEVEL=INFO TORCH_DISTRIBUTED_DEBUG=DETAIL`. More details can be found [here](https://pytorch.org/docs/stable/distributed.html#logging).
+
+## Paddle Implementation {{ paddle_icon }}
+
+Currently, parallel training in the Paddle version is implemented in the form of Paddle's Distributed Data Parallel ([DDP](https://www.paddlepaddle.org.cn/documentation/docs/zh/develop/guides/06_distributed_training/cluster_quick_start_collective_cn.html)).
+DeePMD-kit will decide whether to launch the training in parallel (distributed) mode or in serial mode depending on your execution command.
+
+### Dataloader and Dataset
+
+First, we establish a DeepmdData class for each system, which is consistent with the TensorFlow version at this level. Then, we create a dataloader for each system, resulting in the same number of dataloaders as the number of systems. Next, we create a dataset for the dataloaders obtained in the previous step. This allows us to query the data for each system through this dataset, while the iteration pointers for each system are maintained by their respective dataloaders. Finally, a dataloader is created for the outermost dataset.
+
+We achieve custom sampling methods using a weighted sampler. The length of the sampler is set to `total_batch_num * num_workers`. The parameter `num_workers` defines the number of threads involved in multi-threaded loading, which can be modified by setting the environment variable `NUM_WORKERS` (default: `min(8, ncpus)`).
+
+> **Note** The underlying dataloader uses a distributed sampler to ensure that each GPU receives batches with different content in parallel mode, and a sequential sampler in serial mode. In the TensorFlow version, Horovod shuffles the dataset using different random seeds for the same purpose.
+
+```mermaid
+flowchart LR
+ subgraph systems
+ subgraph system1
+ direction LR
+ frame1[frame 1]
+ frame2[frame 2]
+ end
+ subgraph system2
+ direction LR
+ frame3[frame 3]
+ frame4[frame 4]
+ frame5[frame 5]
+ end
+ end
+ subgraph dataset
+ dataset1[dataset 1]
+ dataset2[dataset 2]
+ end
+ system1 -- frames --> dataset1
+ system2 --> dataset2
+ subgraph distributed sampler
+ ds1[distributed sampler 1]
+ ds2[distributed sampler 2]
+ end
+ dataset1 --> ds1
+ dataset2 --> ds2
+ subgraph dataloader
+ dataloader1[dataloader 1]
+ dataloader2[dataloader 2]
+ end
+ ds1 -- mini batch --> dataloader1
+ ds2 --> dataloader2
+ subgraph index[index on Rank 0]
+ dl11[dataloader 1, entry 1]
+ dl21[dataloader 2, entry 1]
+ dl22[dataloader 2, entry 2]
+ end
+ dataloader1 --> dl11
+ dataloader2 --> dl21
+ dataloader2 --> dl22
+ index -- for each step, choose 1 system --> WeightedSampler
+ --> dploaderset --> bufferedq[buffered queue] --> model
+```
+
+### How to use
+
+We use [`paddle.distributed.fleet`](https://www.paddlepaddle.org.cn/documentation/docs/zh/guides/06_distributed_training/cluster_quick_start_collective_cn.html) for DDP training, launched via `python -m paddle.distributed.launch`.
+
+To start training with multiple GPUs in one node, set environment variable `CUDA_VISIBLE_DEVICES` as the list of GPUs you want to use:
+
+```bash
+# example for training with 4 gpus in one node
+NUM_WORKERS=0 HDF5_USE_FILE_LOCKING=0 CUDA_VISIBLE_DEVICES=0,1,2,3 python -m paddle.distributed.launch --gpus="0,1,2,3" dp --pd train input.json
+```
+
+Suppose you have 2 nodes, each with 4 GPUs, whose IP addresses are `192.168.1.2` and `192.168.1.3`; then you can use `paddle.distributed.launch` to launch a DDP training session:
+
+```bash
+# run in node 192.168.1.2
+NUM_WORKERS=0 HDF5_USE_FILE_LOCKING=0 python -m paddle.distributed.launch \
+ --gpus=0,1,2,3 \
+ --ips=192.168.1.2,192.168.1.3 \
+ dp --pd train input.json
+
+# then run in the other node 192.168.1.3
+NUM_WORKERS=0 HDF5_USE_FILE_LOCKING=0 python -m paddle.distributed.launch \
+ --gpus=0,1,2,3 \
+ --ips=192.168.1.2,192.168.1.3 \
+ dp --pd train input.json
+```
+
+:::{note}
+
+If `NUM_WORKERS` is too large, it may cause the program to be terminated by the system;
+if it is too small, it may slow down data reading. You can try adjusting it to an appropriate size.
+
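+For example (a usage sketch), to use four dataloader workers:
+
+```bash
+NUM_WORKERS=4 dp --pd train input.json
+```
+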
+:::
diff --git a/doc/train/tensorboard.md b/doc/train/tensorboard.md
index 32ecdd0ab2..3925ab3d3d 100644
--- a/doc/train/tensorboard.md
+++ b/doc/train/tensorboard.md
@@ -1,7 +1,7 @@
-# TensorBoard Usage {{ tensorflow_icon }} {{ pytorch_icon }}
+# TensorBoard Usage {{ tensorflow_icon }} {{ pytorch_icon }} {{ paddle_icon }}
:::{note}
-**Supported backends**: TensorFlow {{ tensorflow_icon }}, PyTorch {{ pytorch_icon }}
+**Supported backends**: TensorFlow {{ tensorflow_icon }}, PyTorch {{ pytorch_icon }}, Paddle {{ paddle_icon }}
:::
TensorBoard provides the visualization and tooling needed for machine learning
diff --git a/doc/train/training.md b/doc/train/training.md
index 5e8f8db498..8f491cc7a8 100644
--- a/doc/train/training.md
+++ b/doc/train/training.md
@@ -26,6 +26,14 @@ $ dp --pt train input.json
:::
+:::{tab-item} Paddle {{ paddle_icon }}
+
+```bash
+$ dp --pd train input.json
+```
+
+:::
+
::::
where `input.json` is the name of the input script.
From c7b21f8d62cd430ccda4ffda2f90589d14e7fbf9 Mon Sep 17 00:00:00 2001
From: HydrogenSulfate <490868991@qq.com>
Date: Thu, 26 Dec 2024 13:47:30 +0800
Subject: [PATCH 2/8] Update README.md
Co-authored-by: Jinzhe Zeng
Signed-off-by: HydrogenSulfate <490868991@qq.com>
---
README.md | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/README.md b/README.md
index e374039144..2af98f3057 100644
--- a/README.md
+++ b/README.md
@@ -19,7 +19,7 @@ For more information, check the [documentation](https://deepmd.readthedocs.io/).
### Highlighted features
-- **interfaced with multiple backends**, including TensorFlow, PyTorch, JAX and Paddle, the most popular deep learning frameworks, making the training process highly automatic and efficient.
+- **interfaced with multiple backends**, including TensorFlow, PyTorch, JAX, and Paddle, the most popular deep learning frameworks, making the training process highly automatic and efficient.
- **interfaced with high-performance classical MD and quantum (path-integral) MD packages**, including LAMMPS, i-PI, AMBER, CP2K, GROMACS, OpenMM, and ABACUS.
- **implements the Deep Potential series models**, which have been successfully applied to finite and extended systems, including organic molecules, metals, semiconductors, insulators, etc.
- **implements MPI and GPU supports**, making it highly efficient for high-performance parallel and distributed computing.
From ea1bfe18fcc4731b8ea1d9b07dbe9af490232e2c Mon Sep 17 00:00:00 2001
From: HydrogenSulfate <490868991@qq.com>
Date: Thu, 26 Dec 2024 13:47:39 +0800
Subject: [PATCH 3/8] Update doc/_static/paddle.svg
Co-authored-by: Jinzhe Zeng
Signed-off-by: HydrogenSulfate <490868991@qq.com>
---
doc/_static/paddle.svg | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/doc/_static/paddle.svg b/doc/_static/paddle.svg
index 5fdd09df04..1b7be12e3e 100644
--- a/doc/_static/paddle.svg
+++ b/doc/_static/paddle.svg
@@ -1,6 +1,6 @@