Commit 684703f
[LLM] First commit the llm deployment code
1 parent 980c0a1 commit 684703f
11,814 files changed
Lines changed: 127294 additions & 1293102 deletions
File tree
- benchmark
- cpp
- config
- paddlex
- config
- python
- c_api
- fastdeploy_capi
- core
- internal
- runtime
- vision
- classification/ppcls
- detection
- contrib/yolo
- ppdet
- ocr/ppocr
- segmentation/ppseg
- cmake
- cpack
- csharp
- fastdeploy
- vision
- classification/ppcls
- detection
- contrib
- ppdet
- ocr
- segmentation
- custom_ops
- cpu_ops
- gpu_ops
- append_attn
- template_instantiation
- common
- cutlass_extensions
- arch
- epilogue
- threadblock
- thread
- gemm
- collective
- device
- kernel
- threadblock
- warp
- transform/threadblock
- util
- cutlass_kernels
- fp8_gemm_fused
- dual_gemm
- device
- kernel
- threadblock
- thread
- fpA_intB_gemm
- moe_gemm
- w4a8_moe
- cutlass_extensions
- arch
- epilogue
- threadblock
- gemm
- kernel
- threadblock
- warp
- fp8_deep_gemm
- deep_gemm
- include/deep_gemm
- jit_kernels
- jit
- tests
- fp8_gemm_with_cutlass
- glog
- int8_gemm_with_cutlass
- moe
- speculate_decoding
- draft_model
- docs
- api_docs
- cpp
- csharp
- python
- api/vision_results
- cn
- build_and_install
- faq
- horizon
- rknpu2
- quick_start
- models
- runtime
- docs_i18n
- en
- build_and_install
- faq
- horizon
- rknpu2
- quick_start
- models
- runtime
- examples
- application
- go
- ppyoloe
- yolov5
- yolov8
- java
- ppyoloe
- cpp
- java
- yolov5
- cpp
- java
- yolov8
- cpp
- java
- js
- converter
- mini_program
- ocrXcx
- pages/index
- img
- wasm
- ocrdetectXcx
- pages/index
- img
- wasm
- package
- packages/paddlejs-models
- detect
- build_package
- src
- test
- facedetect
- build_package
- src
- test
- gesture
- build_package
- src
- test
- humanseg_gpu
- build_package
- src
- customOp
- customTransformer
- test
- thirdParty
- humanseg
- build_package
- src
- customOp
- customTransformer
- test
- thirdParty
- mobilenet
- build_package
- src
- test
- ocrdetection
- build_package
- src
- test
- ocr
- build_package
- src
- test
- web_demo
- public
- src
- assets
- components
- icons
- pages
- cv
- detection
- FaceDetection
- ScrewDetection
- ocr
- TextDetection
- TextRecognition
- recognition
- GestureRecognition
- ItemIdentification
- WineBottleIdentification
- segmentation
- HumanSeg_gpu
- HumanSeg
- main
- img
- router
- utils
- views
- detection
- ocr
- recognition
- segmentation
- utils
- rust
- ppyoloe
- src
- yolov5
- src
- yolov8
- src
- audio
- pp-tts
- python
- serving
- streaming_pp_tts
- 1
- silero-vad
- cpp
- multimodal/stable_diffusion
- cpp
- swift+coreml
- ml-stable-diffusion
- swift_coreml_diffusers
- swift_simplest_demo
- swift_stable_diffusion_demo.xcodeproj
- project.xcworkspace
- xcuserdata/lishicheng03.xcuserdatad/xcschemes
- swift_stable_diffusion_demo
- runtime
- cpp
- python
- text
- ernie-3.0
- cpp
- python
- serving
- models
- ernie_seqcls_model
- 1
- ernie_seqcls_postprocess
- 1
- ernie_seqcls
- 1
- ernie_tokencls_model
- 1
- ernie_tokencls_postprocess
- 1
- ernie_tokencls
- 1
- ernie_tokenizer
- 1
- uie
- cpp
- python
- serving
- models/uie
- 1
- vision
- classification
- paddleclas
- amlogic/a311d
- cpp
- android
- app
- src
- androidTest/java/com/baidu/paddle/fastdeploy
- main
- assets/labels
- java/com/baidu/paddle/fastdeploy/app
- examples/classification
- ui
- layout
- view
- adapter
- model
- res
- drawable-v24
- drawable-xhdpi
- drawable-xxhdpi-v4
- drawable
- layout
- mipmap-anydpi-v26
- mipmap-hdpi
- mipmap-mdpi
- mipmap-xhdpi
- mipmap-xxhdpi
- mipmap-xxxhdpi
- values
- xml
- gradle/wrapper
- ascend
- cpp
- python
- cpu-gpu
- cpp
- csharp
- c
- python
- graphcore
- cpp
- python
- horizon
- cpp
- kunlunxin
- cpp
- python
- quantize
- rockchip
- rknpu2
- cpp
- python
- rknpu2_tools
- config
- rv1126
- cpp
- serving
- models
- paddlecls
- 1
- postprocess
- 1
- preprocess
- 1
- runtime
- 1
- sophgo
- cpp
- python
- web
- ppshitu/cpu-gpu
- cpp
- python
- resnet
- cpp
- python
- yolov5cls
- cpp
- python
- detection
- fastestdet
- cpp
- python
- nanodet_plus
- cpp
- python
- paddledetection
- a311d
- cpp
- android
- app
- src
- androidTest/java/com/baidu/paddle/fastdeploy
- main
- assets/labels
- java/com/baidu/paddle/fastdeploy/app
- examples/detection
- ui
- layout
- view
- adapter
- model
- res
- drawable-v24
- drawable-xhdpi
- drawable-xxhdpi-v4
- drawable
- layout-land
- layout
- mipmap-anydpi-v26
- mipmap-hdpi
- mipmap-mdpi
- mipmap-xhdpi
- mipmap-xxhdpi
- mipmap-xxxhdpi
- values
- xml
- gradle/wrapper
- cpp
- csharp
- c
- horizon
- cpp
- python
- serving
- quantize
- cpp
- python
- rknpu2
- cpp
- python
- rv1126
- cpp
- serving
- models
- postprocess
- 1
- ppdet
- 1
- preprocess
- 1
- runtime
- 1
- sophgo
- cpp
- python
- tvm
- cpp
- python
- rkyolo
- cpp
- python
- scaledyolov4
- cpp
- python
- yolor
- cpp
- python
- yolov5lite
- cpp
- python
- yolov5seg
- cpp
- python
- yolov5
- a311d
- cpp
- cpp
- csharp
- c
- python
- serving
- quantize
- cpp
- python
- rv1126
- cpp
- serving
- models
- postprocess
- 1
- preprocess
- 1
- runtime
- 1
- yolov5
- 1
- sophgo
- cpp
- python
- yolov6
- cpp
- python
- quantize
- cpp
- python
- yolov7end2end_ort
- cpp
- python
- yolov7end2end_trt
- cpp
- python
- yolov7
- cpp
- python
- quantize
- cpp
- python
- yolov8
- cpp
- python
- yolox
- cpp
- python
- facealign
- face_landmark_1000
- cpp
- python
- pfld
- cpp
- python
- pipnet
- cpp
- python
- facedet
- blazeface
- cpp
- python
- centerface
- cpp
- python
- retinaface
- cpp
- python
- scrfd
- android
- app
- src
- androidTest/java/com/baidu/paddle/fastdeploy
- main
- assets/labels
- java/com/baidu/paddle/fastdeploy/app
- examples/facedet
- ui
- layout
- view
- adapter
- model
- res
- drawable-v24
- drawable-xhdpi
- drawable-xxhdpi-v4
- drawable
- layout
- mipmap-hdpi
- mipmap-mdpi
- mipmap-xhdpi
- mipmap-xxhdpi
- mipmap-xxxhdpi
- values
- xml
- gradle/wrapper
- cpp
- python
- rknpu2
- cpp
- python
- ultraface
- cpp
- python
- yolov5face
- cpp
- python
- yolov7face
- cpp
- python
- faceid
- adaface
- cpp
- python
- insightface
- cpp
- python
- rknpu2
- cpp
- python
- generation/anemigan
- cpp
- python
- headpose
- fsanet
- cpp
- python
- keypointdetection
- det_keypoint_unite
- cpp
- python
- tiny_pose
- cpp
- python
- rknpu2
- cpp
- python
- matting
- modnet
- cpp
- python
- ppmatting
- rvm
- cpp
- python
- ocr/PP-OCR
- android
- app
- src
- androidTest/java/com/baidu/paddle/fastdeploy
- main
- assets/labels
- java/com/baidu/paddle/fastdeploy/app
- examples/ocr
- ui
- layout
- view
- adapter
- model
- res
- drawable-v24
- drawable-xhdpi
- drawable-xxhdpi-v4
- drawable
- layout-land
- layout
- mipmap-anydpi-v26
- mipmap-hdpi
- mipmap-mdpi
- mipmap-xhdpi
- mipmap-xxhdpi
- mipmap-xxxhdpi
- values
- xml
- gradle/wrapper
- ascend
- cpp
- python
- cpu-gpu
- cpp
- csharp
- c
- python
- kunlunxin
- cpp
- python
- rockchip
- cpp
- python
- rknpu2_tools
- config
- serving
- fastdeploy_serving
- models
- cls_postprocess
- 1
- cls_pp
- cls_runtime
- det_postprocess
- 1
- det_preprocess
- 1
- det_runtime
- pp_ocr
- rec_postprocess
- 1
- rec_pp
- rec_runtime
- simple_serving
- sophgo
- cpp
- python
- web
- perception/paddle3d
- centerpoint/cpp
- petr
- cpp
- python
- smoke
- cpp
- python
- serving
- models
- postprocess
- 1
- preprocess
- 1
- runtime
- 1
- smoke
- 1
- segmentation/paddleseg
- matting
- ascend
- cpu-gpu
- cpp
- python
- kunlunxin
- semantic_segmentation
- amlogic/a311d
- cpp
- android
- app
- src
- androidTest/java/com/baidu/paddle/fastdeploy
- main
- assets/labels
- java/com/baidu/paddle/fastdeploy/app
- examples/segmentation
- ui
- layout
- view
- adapter
- model
- res
- drawable-v24
- drawable-xhdpi
- drawable-xxhdpi-v4
- drawable
- layout
- mipmap-anydpi-v26
- mipmap-hdpi
- mipmap-mdpi
- mipmap-xhdpi
- mipmap-xxhdpi
- mipmap-xxxhdpi
- values
- xml
- gradle/wrapper
- ascend
- cpp
- python
- cpu-gpu
- cpp
- csharp
- c
- python
- kunlunxin
- cpp
- python
- quantize
- rockchip
- rknpu2
- cpp
- python
- rv1126
- cpp
- serving
- fastdeploy_serving
- PP_LiteSeg_B_STDC2_cityscapes_with_argmax_infer
- models
- paddleseg
- 1
- postprocess
- 1
- preprocess
- 1
- runtime
- 1
- simple_serving
- sophgo
- cpp
- python
- web
- sr
- basicvsr
- cpp
- python
- edvr
- cpp
- python
- ppmsvsr
- cpp
- python
- tracking/pptracking
- cpp
- python
- fastdeploy
- benchmark
- core
- distributed
- encryption
- include
- src
- util
- include
- constant
- crypto
- src
- crypto
- engine
- entrypoints
- openai
- function
- input
- mm_processor
- image_preprocessor
- tokenizer
- utils
- multimodal
- metrics
- model_executor
- eplb
- graph_optimization
- layers
- attention
- ops
- backends
- npu
- xpu
- quantization
- moe
- quantization
- sample
- ops
- models
- ops
- cpu
- gpu
- npu
- xpu
- pipeline
- pptinypose
- platforms
- pybind
- runtime
- backends
- common/cuda
- horizon
- lite
- openvino
- ort
- ops
- paddle
- ops
- poros
- common
- rknpu2
- sophgo
- tensorrt
- ops
- tvm
- scheduler
- text
- common
- postprocessor
- preprocessor
- uie
- utils
- vision
- classification
- contrib
- yolov5cls
- ppcls
- ppshitu
- common
- image_decoder
- processors
- detection/contrib
- fastestdet
- rknpu2
- yolov5
Some content is hidden
Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.
This file was deleted.
This file was deleted.
0 commit comments