diff --git a/README.md b/README.md
index dbdd66dd821459e9e85674c01185cda73a6fc39a..a6c0bd4eafadfc836067176cd6aba71ff0a89806 100644
--- a/README.md
+++ b/README.md
@@ -46,10 +46,10 @@ Paddle Lite提供了C++、Java、Python三种API，并且提供了相应API的
 - [CUDA示例](https://paddle-lite.readthedocs.io/zh/latest/demo_guides/cuda.html)
 - [OpenCL示例](https://paddle-lite.readthedocs.io/zh/latest/demo_guides/opencl.html)
 - [FPGA示例](https://paddle-lite.readthedocs.io/zh/latest/demo_guides/fpga.html)
-- [Huawei NPU示例](https://paddle-lite.readthedocs.io/zh/latest/demo_guides/npu.html)
-- [Baidu XPU示例](https://paddle-lite.readthedocs.io/zh/latest/demo_guides/baidu_xpu.html)
-- [RKNPU示例](https://paddle-lite.readthedocs.io/zh/latest/demo_guides/rockchip_npu.html)
-- [MTK APU示例](https://paddle-lite.readthedocs.io/zh/latest/demo_guides/mediatek_apu.html)
+- [华为NPU示例](https://paddle-lite.readthedocs.io/zh/latest/demo_guides/huawei_kirin_npu.html)
+- [百度XPU示例](https://paddle-lite.readthedocs.io/zh/latest/demo_guides/baidu_xpu.html)
+- [瑞芯微NPU示例](https://paddle-lite.readthedocs.io/zh/latest/demo_guides/rockchip_npu.html)
+- [联发科APU示例](https://paddle-lite.readthedocs.io/zh/latest/demo_guides/mediatek_apu.html)
 
 
 
diff --git a/docs/introduction/support_operation_list.md b/docs/introduction/support_operation_list.md
index 7a60cf46e424dfe610a0541c9e364cf6e5d98531..1a0ba4e3c60b6dafdb42fc97299847894069b714 100644
--- a/docs/introduction/support_operation_list.md
+++ b/docs/introduction/support_operation_list.md
@@ -1,402 +1,222 @@
-# 支持OP
+# 支持算子
 
-## Ops （共计158个算子）
+当前Paddle-Lite共计支持算子204个，其中基础算子78个，附加算子126个。
 
-### Basic Operators (默认编译的算子)
-- affine_channel
-- arg_max
-- batch_norm
-- bilinear_interp
-- box_coder
-- calib
-- cast
-- concat
-- conv2d
-- conv2d_transpose
-- density_prior_box
-- depthwise_conv2d
-- dropout
-- elementwise_add
-- elementwise_div
-- elementwise_max
-- elementwise_mul
-- elementwise_sub
-- exp
-- expand
-- fake_channel_wise_dequantize_max_abs
-- fake_dequantize_max_abs
-- fake_quantize_abs_max
-- fake_quantize_dequantize_moving_average_abs_max
-- fake_quantize_moving_average_abs_max
-- fake_quantize_range_abs_max
-- fc
-- feed
-- fetch
-- fill_constant
-- fill_constant_batch_size_like
-- flatten
-- flatten2
-- floor
-- fusion_elementwise_add_activation
-- fusion_elementwise_div_activation
-- fusion_elementwise_max_activation
-- fusion_elementwise_mul_activation
-- fusion_elementwise_sub_activation
-- gelu
-- grid_sampler
-- hard_sigmoid
-- instance_norm
-- io_copy
-- io_copy_once
-- layout
-- leaky_relu
-- log
-- matmul
-- mean
-- mul
-- multiclass_nms
-- nearest_interp
-- pad2d
-- pool2d
-- prelu
-- prior_box
-- range
-- reduce_mean
-- relu
-- relu6
-- relu_clipped
-- reshape
-- reshape2
-- rsqrt
-- scale
-- search_fc
-- sequence_topk_avg_pooling
-- shuffle_channel
-- sigmoid
-- slice
-- softmax
-- softsign
-- split
-- sqrt
-- square
-- squeeze
-- squeeze2
-- stack
-- subgraph
-- swish
-- tanh
-- transpose
-- transpose2
-- unsqueeze
-- unsqueeze2
-- yolo_box
+### 基础算子
 
-### Extra Operators (打开 `--build_extra=ON`开关才会编译)
+默认编译的算子，共计78个：
 
-- anchor_generator
-- assign
-- assign_value
-- attention_padding_mask
-- axpy
-- beam_search
-- beam_search_decode
-- box_clip
-- calib_once
-- collect_fpn_proposals
-- conditional_block
-- crop
-- decode_bboxes
-- distribute_fpn_proposals
-- equal
-- gather
-- generate_proposals
-- graph_op
-- greater_equal
-- greater_than
-- gru
-- gru_unit
-- im2sequence
-- increment
-- is_empty
-- layer_norm
-- layout_once
-- less_equal
-- less_than
-- lod_reset
-- logical_and
-- logical_not
-- logical_or
-- logical_xor
-- lookup_table
-- lookup_table_v2
-- lrn
-- match_matrix_tensor
-- merge_lod_tensor
-- negative
-- norm
-- not_equal
-- power
-- read_from_array
-- reduce_max
-- reduce_prod
-- reduce_sum
-- roi_align
-- search_aligned_mat_mul
-- search_attention_padding_mask
-- search_grnn
-- search_group_padding
-- search_seq_arithmetic
-- search_seq_depadding
-- search_seq_fc
-- search_seq_softmax
-- sequence_arithmetic
-- sequence_concat
-- sequence_expand
-- sequence_expand_as
-- sequence_pool
-- sequence_reshape
-- sequence_reverse
-- sequence_softmax
-- shape
-- split_lod_tensor
-- top_k
-- uniform_random
-- var_conv_2d
-- while
-- write_to_array
+| OP Name | Host | X86 | CUDA | ARM | OpenCL | FPGA | 华为NPU | 百度XPU | 瑞芯微NPU | 联发科APU |
+|-:|-|-|-|-|-|-|-|-|-|-|
+| affine_channel | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| affine_grid | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| arg_max | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| assign_value | 　 | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| batch_norm | 　 | Y | 　 | Y | 　 | 　 | Y | Y | Y | 　 |
+| bilinear_interp | 　 | 　 | Y | Y | Y | 　 | Y | 　 | 　 | 　 |
+| box_coder | 　 | 　 | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 |
+| calib | 　 | 　 | Y | Y | 　 | Y | 　 | 　 | 　 | 　 |
+| cast | 　 | Y | 　 | Y | 　 | 　 | 　 | Y | 　 | 　 |
+| concat | 　 | Y | Y | Y | Y | 　 | Y | 　 | Y | 　 |
+| conv2d | 　 | Y | Y | Y | Y | Y | Y | Y | Y | Y |
+| conv2d_transpose | 　 | 　 | 　 | Y | 　 | 　 | Y | 　 | 　 | 　 |
+| density_prior_box | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| depthwise_conv2d | 　 | Y | Y | Y | Y | Y | Y | Y | Y | Y |
+| depthwise_conv2d_transpose | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| dropout | 　 | Y | Y | Y | Y | Y | Y | Y | 　 | 　 |
+| elementwise_add | 　 | Y | Y | Y | Y | Y | Y | Y | Y | Y |
+| elementwise_div | 　 | 　 | 　 | Y | 　 | 　 | Y | 　 | Y | 　 |
+| elementwise_max | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| elementwise_mod | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| elementwise_mul | 　 | Y | Y | Y | Y | Y | Y | 　 | Y | Y |
+| elementwise_pow | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| elementwise_sub | 　 | Y | Y | Y | Y | 　 | Y | 　 | Y | 　 |
+| elu | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| expand | Y | 　 | 　 | 　 | Y | 　 | Y | 　 | 　 | 　 |
+| expand_as | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| fc | 　 | Y | Y | Y | Y | Y | Y | 　 | Y | Y |
+| feed | Y | 　 | Y | 　 | 　 | Y | 　 | 　 | 　 | 　 |
+| fetch | Y | 　 | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 |
+| fill_constant | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| fill_constant_batch_size_like | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| flatten | Y | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 |
+| flatten2 | Y | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 |
+| fusion_elementwise_add_activation | 　 | 　 | Y | Y | Y | Y | Y | 　 | 　 | 　 |
+| fusion_elementwise_div_activation | 　 | 　 | 　 | Y | 　 | 　 | Y | 　 | 　 | 　 |
+| fusion_elementwise_max_activation | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| fusion_elementwise_mul_activation | 　 | 　 | Y | Y | 　 | 　 | Y | 　 | 　 | 　 |
+| fusion_elementwise_sub_activation | 　 | 　 | Y | Y | Y | 　 | Y | 　 | 　 | 　 |
+| grid_sampler | 　 | 　 | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 |
+| instance_norm | 　 | 　 | 　 | Y | Y | 　 | Y | 　 | 　 | 　 |
+| io_copy | 　 | 　 | Y | 　 | Y | Y | 　 | 　 | 　 | 　 |
+| io_copy_once | 　 | 　 | Y | 　 | Y | Y | 　 | 　 | 　 | 　 |
+| layout | 　 | 　 | Y | Y | Y | Y | 　 | 　 | 　 | 　 |
+| leaky_relu | 　 | Y | Y | Y | Y | 　 | Y | 　 | 　 | 　 |
+| matmul | 　 | Y | Y | Y | 　 | 　 | Y | Y | 　 | 　 |
+| mul | 　 | Y | Y | Y | 　 | 　 | Y | Y | 　 | 　 |
+| multiclass_nms | Y | 　 | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 |
+| multiclass_nms2 | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| nearest_interp | 　 | 　 | Y | Y | Y | 　 | Y | 　 | 　 | 　 |
+| pad2d | 　 | 　 | 　 | Y | Y | 　 | Y | 　 | 　 | 　 |
+| pool2d | 　 | Y | Y | Y | Y | Y | Y | Y | Y | Y |
+| prelu | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| prior_box | 　 | 　 | 　 | Y | 　 | Y | 　 | 　 | 　 | 　 |
+| range | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| reduce_mean | 　 | 　 | 　 | Y | 　 | 　 | Y | 　 | 　 | 　 |
+| relu | 　 | Y | Y | Y | Y | 　 | Y | 　 | Y | Y |
+| relu6 | 　 | 　 | 　 | Y | Y | 　 | Y | 　 | 　 | 　 |
+| reshape | Y | Y | 　 | 　 | Y | 　 | Y | Y | 　 | 　 |
+| reshape2 | Y | Y | 　 | 　 | Y | 　 | Y | Y | 　 | 　 |
+| scale | 　 | Y | Y | Y | Y | Y | Y | Y | 　 | 　 |
+| search_fc | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| sequence_topk_avg_pooling | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| shuffle_channel | 　 | 　 | 　 | Y | 　 | 　 | Y | 　 | 　 | 　 |
+| sigmoid | 　 | Y | Y | Y | Y | 　 | Y | 　 | 　 | 　 |
+| slice | 　 | Y | 　 | Y | Y | 　 | 　 | Y | 　 | 　 |
+| softmax | 　 | Y | Y | Y | 　 | 　 | Y | Y | Y | Y |
+| split | 　 | 　 | 　 | Y | 　 | 　 | Y | 　 | 　 | 　 |
+| squeeze | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| squeeze2 | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| stack | 　 | Y | 　 | Y | 　 | 　 | 　 | Y | 　 | 　 |
+| subgraph | 　 | 　 | 　 | 　 | 　 | 　 | Y | Y | Y | Y |
+| tanh | 　 | Y | Y | Y | Y | 　 | Y | Y | 　 | 　 |
+| thresholded_relu | 　 | 　 | 　 | Y | 　 | 　 | Y | 　 | 　 | 　 |
+| transpose | 　 | Y | Y | Y | Y | 　 | Y | Y | 　 | 　 |
+| transpose2 | 　 | Y | Y | Y | Y | 　 | Y | Y | 　 | 　 |
+| unsqueeze | Y | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 | 　 |
+| unsqueeze2 | Y | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 | 　 |
+| yolo_box | 　 | 　 | Y | Y | 　 | 　 | 　 | Y | 　 | 　 |
 
 
+### 附加算子
 
-## Kernels
+附加算子共计126个，需要在编译时打开`--build_extra=ON`开关才会编译，具体请参考[参数详情](../source_compile/library)。
 
-### Host kernels
-
-- feed
-- fetch
-- flatten
-- flatten2
-- multiclass_nms
-- reshape
-- reshape2
-
-### ARM kernels
-
-- affine_channel
-- anchor_generator
-- arg_max
-- assign
-- assign_value
-- axpy
-- batch_norm
-- beam_search
-- beam_search_decode
-- bilinear_interp
-- box_clip
-- box_coder
-- cast
-- collect_fpn_proposals
-- concat
-- conditional_block
-- conv2d
-- conv2d_transpose
-- crop
-- decode_bboxes
-- density_prior_box
-- depthwise_conv2d
-- distribute_fpn_proposals
-- dropout
-- elementwise_add
-- elementwise_div
-- elementwise_max
-- elementwise_mul
-- elementwise_sub
-- equal
-- exp
-- expand
-- fc
-- fill_constant
-- fill_constant_batch_size_like
-- floor
-- fusion_elementwise_add_activation
-- fusion_elementwise_div_activation
-- fusion_elementwise_max_activation
-- fusion_elementwise_mul_activation
-- fusion_elementwise_sub_activation
-- gather
-- generate_proposals
-- greater_equal
-- greater_than
-- gru
-- gru_unit
-- hard_sigmoid
-- im2sequence
-- increment
-- instance_norm
-- is_empty
-- layer_norm
-- layout
-- layout_once
-- leaky_relu
-- less_equal
-- less_than
-- lod_reset
-- log
-- logical_and
-- logical_not
-- logical_or
-- logical_xor
-- lookup_table
-- lookup_table_v2
-- lrn
-- matmul
-- merge_lod_tensor
-- mul
-- nearest_interp
-- negative
-- norm
-- not_equal
-- pad2d
-- pool2d
-- power
-- prelu
-- prior_box
-- range
-- read_from_array
-- reduce_max
-- reduce_mean
-- reduce_prod
-- relu
-- relu6
-- relu_clipped
-- roi_align
-- rsqrt
-- scale
-- sequence_expand
-- sequence_pool
-- sequence_softmax
-- shape
-- shuffle_channel
-- sigmoid
-- slice
-- softmax
-- split
-- split_lod_tensor
-- squeeze
-- squeeze2
-- stack
-- swish
-- tanh
-- top_k
-- transpose
-- transpose2
-- unsqueeze
-- unsqueeze2
-- while
-- write_to_array
-- yolo_box
-
-
-### X86 kernels
-- batch_norm
-- cast
-- concat
-- conv2d
-- depthwise_conv2d
-- dropout
-- elementwise_add
-- elementwise_sub
-- fc
-- fill_constant_batch_size_like
-- gather
-- gelu
-- gru
-- layer_norm
-- match_matrix_tensor
-- matmul
-- mul
-- pool2d
-- reduce_sum
-- relu
-- reshape
-- reshape2
-- scale
-- search_aligned_mat_mul
-- search_attention_padding_mask
-- search_fc
-- search_grnn
-- search_group_padding
-- search_seq_arithmetic
-- search_seq_depadding
-- search_seq_fc
-- search_seq_softmax
-- sequence_arithmetic
-- sequence_concat
-- sequence_expand_as
-- sequence_pool
-- sequence_reverse
-- sequence_topk_avg_pooling
-- shape
-- slice
-- softmax
-- softsign
-- square
-- squeeze
-- squeeze2
-- stack
-- tanh
-- transpose
-- transpose2
-- var_conv_2d
-
-### CUDA kernels
-- attention_padding_mask
-- bilinear_interp
-- calib
-- concat
-- conv
-- dropout
-- elementwise_add
-- fusion_elementwise_add_activation
-- fusion_elementwise_mul_activation
-- elementwise_mul
-- feed
-- io_copy
-- layout
-- layout_once
-- leaky_relu
-- lookup_table
-- match_matrix_tensor
-- mul
-- nearest_interp
-- pool2d
-- relu
-- scale
-- search_aligned_mat_mul
-- search_fc
-- search_grnn
-- search_group_padding
-- search_seq_depadding
-- search_seq_fc
-- sequence_arithmetic
-- sequence_concat
-- sequence_pool
-- sequence_reverse
-- sequence_topk_avg_pooling
-- softmax
-- transpose
-- var_conv_2d
-- yolo_box
-
-### OpenCL kernels
-- conv2d
-- depthwise_conv2d
-- elementwise_add
-- fc
-- fusion_elementwise_add_activation
-- layout
-- layout_once
-- io_copy
-- io_copy_once
-- mul
-- pool2d
-- relu
+| OP Name | Host | X86 | CUDA | ARM | OpenCL | FPGA | 华为NPU | 百度XPU | 瑞芯微NPU | 联发科APU |
+|-:|-|-|-|-|-|-|-|-|-|-|
+| abs | 　 | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| anchor_generator | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| assign | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| attention_padding_mask | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| axpy | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| beam_search | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| beam_search_decode | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| box_clip | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| calib_once | 　 | 　 | Y | Y | 　 | Y | 　 | 　 | 　 | 　 |
+| clip | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| collect_fpn_proposals | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| conditional_block | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| crf_decoding | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| crop | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| ctc_align | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| decode_bboxes | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| deformable_conv | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| distribute_fpn_proposals | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| equal | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| exp | 　 | 　 | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 |
+| fake_channel_wise_dequantize_max_abs | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| fake_dequantize_max_abs | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| fake_quantize_abs_max | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| fake_quantize_dequantize_abs_max | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| fake_quantize_dequantize_moving_average_abs_max | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| fake_quantize_moving_average_abs_max | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| fake_quantize_range_abs_max | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| floor | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| gather | 　 | Y | 　 | Y | 　 | 　 | 　 | Y | 　 | 　 |
+| gelu | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| generate_proposals | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| greater_equal | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| greater_than | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| group_norm | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| gru | 　 | Y | Y | Y | 　 | Y | 　 | 　 | 　 | 　 |
+| gru_unit | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| hard_sigmoid | 　 | 　 | 　 | Y | Y | 　 | Y | 　 | 　 | 　 |
+| hard_swish | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| im2sequence | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| increment | 　 | 　 | 　 | Y | 　 | 　 | Y | 　 | 　 | 　 |
+| is_empty | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| layer_norm | 　 | Y | 　 | Y | 　 | 　 | Y | Y | 　 | 　 |
+| layout_once | 　 | 　 | Y | Y | 　 | Y | 　 | 　 | 　 | 　 |
+| less_equal | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| less_than | Y | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 | 　 |
+| lod_reset | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| log | 　 | 　 | 　 | Y | 　 | 　 | Y | 　 | 　 | 　 |
+| logical_and | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| logical_not | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| logical_or | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| logical_xor | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| lookup_table | 　 | Y | Y | Y | 　 | 　 | 　 | Y | 　 | 　 |
+| lookup_table_dequant | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| lookup_table_v2 | 　 | Y | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| lrn | 　 | 　 | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 |
+| lstm | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| match_matrix_tensor | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| max_pool2d_with_index | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| mean | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| merge_lod_tensor | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| negative | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| norm | 　 | 　 | 　 | Y | 　 | Y | 　 | 　 | 　 | 　 |
+| not_equal | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| one_hot | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| pixel_shuffle | Y | 　 | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 |
+| pow | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| power | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| print | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| read_from_array | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| reciprocal | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| reduce_max | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| reduce_prod | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| reduce_sum | 　 | Y | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 |
+| relu_clipped | 　 | 　 | 　 | Y | 　 | 　 | Y | 　 | 　 | 　 |
+| retinanet_detection_output | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| roi_align | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| rsqrt | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| search_aligned_mat_mul | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| search_attention_padding_mask | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| search_grnn | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| search_group_padding | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| search_seq_arithmetic | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| search_seq_depadding | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| search_seq_fc | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| search_seq_softmax | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| sequence_arithmetic | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| sequence_concat | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| sequence_conv | 　 | Y | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| sequence_expand | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| sequence_expand_as | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| sequence_mask | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| sequence_pad | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| sequence_pool | 　 | Y | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| sequence_pool_concat | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| sequence_reshape | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| sequence_reverse | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| sequence_reverse_embedding | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| sequence_softmax | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| sequence_unpad | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| shape | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| sign | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| softsign | 　 | Y | 　 | 　 | 　 | 　 | Y | 　 | 　 | 　 |
+| split_lod_tensor | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| sqrt | 　 | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 | 　 |
+| square | 　 | Y | 　 | Y | 　 | 　 | Y | 　 | 　 | 　 |
+| swish | 　 | 　 | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 |
+| top_k | 　 | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 |
+| topk_pooling | 　 | 　 | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| uniform_random | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| var_conv_2d | 　 | Y | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| where_index | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| while | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| write_to_array | Y | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | 　 |
+| __xpu__conv2d | 　 | 　 | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 |
+| __xpu__embedding_with_eltwise_add | 　 | 　 | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 |
+| __xpu__fc | 　 | 　 | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 |
+| __xpu__mmdnn_bid_emb_att | 　 | 　 | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 |
+| __xpu__mmdnn_bid_emb_grnn_att | 　 | 　 | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 |
+| __xpu__mmdnn_bid_emb_grnn_att2 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 |
+| __xpu__mmdnn_match_conv_topk | 　 | 　 | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 |
+| __xpu__mmdnn_merge_all | 　 | 　 | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 |
+| __xpu__mmdnn_search_attention | 　 | 　 | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 |
+| __xpu__multi_encoder | 　 | 　 | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 |
+| __xpu__resnet_cbam | 　 | 　 | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 |
+| __xpu__resnet50 | 　 | 　 | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 |
+| __xpu__sfa_head | 　 | 　 | 　 | 　 | 　 | 　 | 　 | Y | 　 | 　 |
diff --git a/docs/quick_start/release_lib.md b/docs/quick_start/release_lib.md
index f708237ef6882412ed648bde72360a3b4c011ee4..5de27839d53df381915b2d4a2dbf6675aa42f6e7 100644
--- a/docs/quick_start/release_lib.md
+++ b/docs/quick_start/release_lib.md
@@ -80,5 +80,5 @@ pip install paddlelite
 - [FPGA源码编译](../demo_guides/fpga)
-- [华为NPU源码编译](../demo_guides/npu)
+- [华为NPU源码编译](../demo_guides/huawei_kirin_npu)
 - [百度XPU源码编译](../demo_guides/baidu_xpu)
-- [Rockchip NPU源码编译](../demo_guides/rockchip_npu)
-- [MediaTek APU源码编译](../demo_guides/mediatek_apu)
+- [瑞芯微NPU源码编译](../demo_guides/rockchip_npu)
+- [联发科APU源码编译](../demo_guides/mediatek_apu)
diff --git a/docs/source_compile/compile_env.md b/docs/source_compile/compile_env.md
index 0f1740a44ccc90f91876523befa504f0455e82e4..5322558afbf2c3ad09f04e0596ddc18f967ffabb 100644
--- a/docs/source_compile/compile_env.md
+++ b/docs/source_compile/compile_env.md
@@ -17,14 +17,14 @@ Paddle Lite提供了Android/iOS/X86平台的官方Release预测库下载，如
 - [Android源码编译](../source_compile/compile_andriod)
 - [iOS源码编译](../source_compile/compile_ios)
 - [ArmLinux源码编译](../source_compile/compile_linux)
-- [x86源码编译](../demo_guides/x86)
+- [X86源码编译](../demo_guides/x86)
 - [OpenCL源码编译](../demo_guides/opencl)
 - [CUDA源码编译](../demo_guides/cuda)
 - [FPGA源码编译](../demo_guides/fpga)
-- [华为NPU源码编译](../demo_guides/npu)
+- [华为NPU源码编译](../demo_guides/huawei_kirin_npu)
 - [百度XPU源码编译](../demo_guides/baidu_xpu)
-- [Rockchip NPU源码编译](../demo_guides/rockchip_npu)
-- [MediaTek APU源码编译](../demo_guides/mediatek_apu)
+- [瑞芯微NPU源码编译](../demo_guides/rockchip_npu)
+- [联发科APU源码编译](../demo_guides/mediatek_apu)
 - [模型优化工具opt源码编译](../user_guides/model_optimize_tool.html#opt)
 
 ## 1. Docker开发环境
diff --git a/docs/source_compile/compile_linux.md b/docs/source_compile/compile_linux.md
index d6be5ba8c55bac26e4a1a22750741f0dafef286f..5753982d2aa1eda0e4acaec764f682e0ddc7fa87 100644
--- a/docs/source_compile/compile_linux.md
+++ b/docs/source_compile/compile_linux.md
@@ -90,7 +90,7 @@ inference_lite_lib.armlinux.armv8
 --opt_model_dir:          输入模型的绝对路径，需要为opt转化之后的模型
 ```
 
-- 编译 Rockchip NPU 预测库方法，详情请参考：[PaddleLite使用RK NPU预测部署](../demo_guides/rockchip_npu)
+- 编译 瑞芯微(Rockchip) NPU 预测库方法，详情请参考：[PaddleLite使用RK NPU预测部署](../demo_guides/rockchip_npu)
 
 ```shell
---with_rockchip_npu: (OFF|ON)    是否编译编译 huawei_kirin_npu 的预测库，默认为OFF
+--with_rockchip_npu: (OFF|ON)    是否编译 rockchip_npu 的预测库，默认为OFF
@@ -98,7 +98,7 @@ inference_lite_lib.armlinux.armv8
 ```
 
 
-- 编译 Baidu XPU 预测库方法, 详情请参考：[PaddleLite使用百度XPU预测部署](../demo_guides/baidu_xpu)
+- 编译 百度(Baidu) XPU 预测库方法，详情请参考：[PaddleLite使用百度XPU预测部署](../demo_guides/baidu_xpu)
 
 ```shell
---with_baidu_xpu: (OFF|ON)    是否编译编译 baidu_xpu 的预测库，默认为OFF
+--with_baidu_xpu: (OFF|ON)    是否编译 baidu_xpu 的预测库，默认为OFF
diff --git a/docs/source_compile/compile_options.md b/docs/source_compile/compile_options.md
index f24eb2ad1e07e085407c4145cda810137e268e9d..13254919ae44655176f97b8dbb7897ddb457f2eb 100644
--- a/docs/source_compile/compile_options.md
+++ b/docs/source_compile/compile_options.md
@@ -51,8 +51,8 @@
 | LITE_WITH_PYTHON |  编译支持[Python API](../api_reference/python_api_doc.html)的预测库 | X86 / CUDA |OFF |
 | LITE_WITH_OPENCL |  编译[OpenCL平台](../demo_guides/opencl.html)预测库 | OpenCL | OFF |
 | LITE_WITH_FPGA |  编译[FPGA平台](../demo_guides/fpga.html)预测库 | FPGA | OFF |
-| LITE_WITH_NPU |  编译[华为NPU平台](../demo_guides/npu.html)预测库 | NPU | OFF |
-| LITE_WITH_RKNPU |  编译[RK NPU平台](../demo_guides/rockchip_npu.html)预测库 | RKNPU | OFF |
+| LITE_WITH_NPU |  编译[华为NPU平台](../demo_guides/huawei_kirin_npu.html)预测库 | NPU | OFF |
+| LITE_WITH_RKNPU |  编译[瑞芯微NPU平台](../demo_guides/rockchip_npu.html)预测库 | RKNPU | OFF |
 | LITE_WITH_XPU |  编译[百度XPU平台](../demo_guides/baidu_xpu.html)预测库 | XPU |OFF |
 | LITE_WITH_XTCL | 通过XTCL方式支持百度XPU，默认Kernel方式 | XPU |OFF IF LITE_WITH_XPU |
-| LITE_WITH_APU | 编译[MTK APU平台](../demo_guides/mediatek_apu.html)预测库 | APU |OFF |
+| LITE_WITH_APU | 编译[联发科APU平台](../demo_guides/mediatek_apu.html)预测库 | APU |OFF |
diff --git a/docs/source_compile/library.md b/docs/source_compile/library.md
index 2514e198f84532d1239e090cf6b1d0f228ee6031..ee43c8eb20128a2ee73effb22de828ef24bca7a3 100644
--- a/docs/source_compile/library.md
+++ b/docs/source_compile/library.md
@@ -5,12 +5,12 @@ Lite预测库分为**基础预测库**和**全量预测库(with_extra)**：基
 
 编译时由编译选项 `build_extra`(默认为OFF)控制，`--build_extra=OFF`时编译**基础预测库**，`--build_extra=ON`时编译**全量预测库**。
 
-## 基础预测库( [基础OP列表](../introduction/support_operation_list.html#basic-operators) )
+## 基础预测库( [基础算子](../introduction/support_operation_list.html#id2) )
 
 
 ### 支持功能
 
-（1）87个[基础OP](../introduction/support_operation_list.html#basic-operators)       （2）9个基础模型       （3）3个in8量化模型
+（1）78个[基础算子](../introduction/support_operation_list.html#id2)       （2）9个基础模型       （3）3个int8量化模型
 
 
 ### 支持的模型
@@ -39,12 +39,12 @@ mobilenet_v1   mobilenet_v2   resnet50
 ```
 
 
-## 全量预测库( [OP列表](../introduction/support_operation_list.html#op) )
+## 全量预测库( [支持算子](../introduction/support_operation_list.html#id1) )
 
 
 ### 支持功能
 
-   Paddle-Lite中的全量算子（ [基础OP](../introduction/support_operation_list.html#basic-operators) + [Extra OP](../introduction/support_operation_list.html#extra-operators-build-extra-on) ）
+   Paddle-Lite中的全量算子（ [基础算子](../introduction/support_operation_list.html#id2) + [附加算子](../introduction/support_operation_list.html#id3) ）
 
 ### 特点
    包含更多算子、支持更多模型，但体量更大。