CMakeLists.txt
LICENSE
MANIFEST.in
NOTICE
README.md
setup.py
3rdparty/cub/cub/cub.cuh
3rdparty/cub/cub/util_allocator.cuh
3rdparty/cub/cub/util_arch.cuh
3rdparty/cub/cub/util_debug.cuh
3rdparty/cub/cub/util_device.cuh
3rdparty/cub/cub/util_macro.cuh
3rdparty/cub/cub/util_namespace.cuh
3rdparty/cub/cub/util_ptx.cuh
3rdparty/cub/cub/util_type.cuh
3rdparty/cub/cub/agent/agent_histogram.cuh
3rdparty/cub/cub/agent/agent_radix_sort_downsweep.cuh
3rdparty/cub/cub/agent/agent_radix_sort_upsweep.cuh
3rdparty/cub/cub/agent/agent_reduce.cuh
3rdparty/cub/cub/agent/agent_reduce_by_key.cuh
3rdparty/cub/cub/agent/agent_rle.cuh
3rdparty/cub/cub/agent/agent_scan.cuh
3rdparty/cub/cub/agent/agent_segment_fixup.cuh
3rdparty/cub/cub/agent/agent_select_if.cuh
3rdparty/cub/cub/agent/agent_spmv_orig.cuh
3rdparty/cub/cub/agent/single_pass_scan_operators.cuh
3rdparty/cub/cub/block/block_adjacent_difference.cuh
3rdparty/cub/cub/block/block_discontinuity.cuh
3rdparty/cub/cub/block/block_exchange.cuh
3rdparty/cub/cub/block/block_histogram.cuh
3rdparty/cub/cub/block/block_load.cuh
3rdparty/cub/cub/block/block_radix_rank.cuh
3rdparty/cub/cub/block/block_radix_sort.cuh
3rdparty/cub/cub/block/block_raking_layout.cuh
3rdparty/cub/cub/block/block_reduce.cuh
3rdparty/cub/cub/block/block_scan.cuh
3rdparty/cub/cub/block/block_shuffle.cuh
3rdparty/cub/cub/block/block_store.cuh
3rdparty/cub/cub/block/specializations/block_histogram_atomic.cuh
3rdparty/cub/cub/block/specializations/block_histogram_sort.cuh
3rdparty/cub/cub/block/specializations/block_reduce_raking.cuh
3rdparty/cub/cub/block/specializations/block_reduce_raking_commutative_only.cuh
3rdparty/cub/cub/block/specializations/block_reduce_warp_reductions.cuh
3rdparty/cub/cub/block/specializations/block_scan_raking.cuh
3rdparty/cub/cub/block/specializations/block_scan_warp_scans.cuh
3rdparty/cub/cub/block/specializations/block_scan_warp_scans2.cuh
3rdparty/cub/cub/block/specializations/block_scan_warp_scans3.cuh
3rdparty/cub/cub/device/device_histogram.cuh
3rdparty/cub/cub/device/device_partition.cuh
3rdparty/cub/cub/device/device_radix_sort.cuh
3rdparty/cub/cub/device/device_reduce.cuh
3rdparty/cub/cub/device/device_run_length_encode.cuh
3rdparty/cub/cub/device/device_scan.cuh
3rdparty/cub/cub/device/device_segmented_radix_sort.cuh
3rdparty/cub/cub/device/device_segmented_reduce.cuh
3rdparty/cub/cub/device/device_select.cuh
3rdparty/cub/cub/device/device_spmv.cuh
3rdparty/cub/cub/device/dispatch/dispatch_histogram.cuh
3rdparty/cub/cub/device/dispatch/dispatch_radix_sort.cuh
3rdparty/cub/cub/device/dispatch/dispatch_reduce.cuh
3rdparty/cub/cub/device/dispatch/dispatch_reduce_by_key.cuh
3rdparty/cub/cub/device/dispatch/dispatch_rle.cuh
3rdparty/cub/cub/device/dispatch/dispatch_scan.cuh
3rdparty/cub/cub/device/dispatch/dispatch_select_if.cuh
3rdparty/cub/cub/device/dispatch/dispatch_spmv_orig.cuh
3rdparty/cub/cub/grid/grid_barrier.cuh
3rdparty/cub/cub/grid/grid_even_share.cuh
3rdparty/cub/cub/grid/grid_mapping.cuh
3rdparty/cub/cub/grid/grid_queue.cuh
3rdparty/cub/cub/host/mutex.cuh
3rdparty/cub/cub/iterator/arg_index_input_iterator.cuh
3rdparty/cub/cub/iterator/cache_modified_input_iterator.cuh
3rdparty/cub/cub/iterator/cache_modified_output_iterator.cuh
3rdparty/cub/cub/iterator/constant_input_iterator.cuh
3rdparty/cub/cub/iterator/counting_input_iterator.cuh
3rdparty/cub/cub/iterator/discard_output_iterator.cuh
3rdparty/cub/cub/iterator/tex_obj_input_iterator.cuh
3rdparty/cub/cub/iterator/tex_ref_input_iterator.cuh
3rdparty/cub/cub/iterator/transform_input_iterator.cuh
3rdparty/cub/cub/thread/thread_load.cuh
3rdparty/cub/cub/thread/thread_operators.cuh
3rdparty/cub/cub/thread/thread_reduce.cuh
3rdparty/cub/cub/thread/thread_scan.cuh
3rdparty/cub/cub/thread/thread_search.cuh
3rdparty/cub/cub/thread/thread_store.cuh
3rdparty/cub/cub/warp/warp_reduce.cuh
3rdparty/cub/cub/warp/warp_scan.cuh
3rdparty/cub/cub/warp/specializations/warp_reduce_shfl.cuh
3rdparty/cub/cub/warp/specializations/warp_reduce_smem.cuh
3rdparty/cub/cub/warp/specializations/warp_scan_shfl.cuh
3rdparty/cub/cub/warp/specializations/warp_scan_smem.cuh
3rdparty/cub/examples/block/example_block_radix_sort.cu
3rdparty/cub/examples/block/example_block_reduce.cu
3rdparty/cub/examples/block/example_block_scan.cu
3rdparty/cub/examples/block/reduce_by_key.cu
3rdparty/cub/examples/device/example_device_partition_flagged.cu
3rdparty/cub/examples/device/example_device_partition_if.cu
3rdparty/cub/examples/device/example_device_radix_sort.cu
3rdparty/cub/examples/device/example_device_reduce.cu
3rdparty/cub/examples/device/example_device_scan.cu
3rdparty/cub/examples/device/example_device_select_flagged.cu
3rdparty/cub/examples/device/example_device_select_if.cu
3rdparty/cub/examples/device/example_device_select_unique.cu
3rdparty/cub/examples/device/example_device_sort_find_non_trivial_runs.cu
3rdparty/cub/experimental/histogram_compare.cu
3rdparty/cub/experimental/sparse_matrix.h
3rdparty/cub/experimental/spmv_compare.cu
3rdparty/cub/experimental/defunct/example_coo_spmv.cu
3rdparty/cub/experimental/defunct/test_device_seg_reduce.cu
3rdparty/cub/experimental/histogram/histogram_cub.h
3rdparty/cub/experimental/histogram/histogram_gmem_atomics.h
3rdparty/cub/experimental/histogram/histogram_smem_atomics.h
3rdparty/cub/test/half.h
3rdparty/cub/test/link_a.cu
3rdparty/cub/test/link_b.cu
3rdparty/cub/test/link_main.cpp
3rdparty/cub/test/mersenne.h
3rdparty/cub/test/test_allocator.cu
3rdparty/cub/test/test_block_histogram.cu
3rdparty/cub/test/test_block_load_store.cu
3rdparty/cub/test/test_block_radix_sort.cu
3rdparty/cub/test/test_block_reduce.cu
3rdparty/cub/test/test_block_scan.cu
3rdparty/cub/test/test_device_histogram.cu
3rdparty/cub/test/test_device_radix_sort.cu
3rdparty/cub/test/test_device_reduce.cu
3rdparty/cub/test/test_device_reduce_by_key.cu
3rdparty/cub/test/test_device_run_length_encode.cu
3rdparty/cub/test/test_device_scan.cu
3rdparty/cub/test/test_device_select_if.cu
3rdparty/cub/test/test_device_select_unique.cu
3rdparty/cub/test/test_grid_barrier.cu
3rdparty/cub/test/test_iterator.cu
3rdparty/cub/test/test_util.h
3rdparty/cub/test/test_warp_reduce.cu
3rdparty/cub/test/test_warp_scan.cu
3rdparty/cub/tune/tune_device_reduce.cu
3rdparty/pybind11/CMakeLists.txt
3rdparty/pybind11/docs/requirements.txt
3rdparty/pybind11/include/pybind11/attr.h
3rdparty/pybind11/include/pybind11/buffer_info.h
3rdparty/pybind11/include/pybind11/cast.h
3rdparty/pybind11/include/pybind11/chrono.h
3rdparty/pybind11/include/pybind11/common.h
3rdparty/pybind11/include/pybind11/complex.h
3rdparty/pybind11/include/pybind11/eigen.h
3rdparty/pybind11/include/pybind11/embed.h
3rdparty/pybind11/include/pybind11/eval.h
3rdparty/pybind11/include/pybind11/functional.h
3rdparty/pybind11/include/pybind11/iostream.h
3rdparty/pybind11/include/pybind11/numpy.h
3rdparty/pybind11/include/pybind11/operators.h
3rdparty/pybind11/include/pybind11/options.h
3rdparty/pybind11/include/pybind11/pybind11.h
3rdparty/pybind11/include/pybind11/pytypes.h
3rdparty/pybind11/include/pybind11/stl.h
3rdparty/pybind11/include/pybind11/stl_bind.h
3rdparty/pybind11/include/pybind11/detail/class.h
3rdparty/pybind11/include/pybind11/detail/common.h
3rdparty/pybind11/include/pybind11/detail/descr.h
3rdparty/pybind11/include/pybind11/detail/init.h
3rdparty/pybind11/include/pybind11/detail/internals.h
3rdparty/pybind11/include/pybind11/detail/typeid.h
3rdparty/pybind11/tests/CMakeLists.txt
3rdparty/pybind11/tests/constructor_stats.h
3rdparty/pybind11/tests/cross_module_gil_utils.cpp
3rdparty/pybind11/tests/local_bindings.h
3rdparty/pybind11/tests/object.h
3rdparty/pybind11/tests/pybind11_cross_module_tests.cpp
3rdparty/pybind11/tests/pybind11_tests.cpp
3rdparty/pybind11/tests/pybind11_tests.h
3rdparty/pybind11/tests/test_async.cpp
3rdparty/pybind11/tests/test_buffers.cpp
3rdparty/pybind11/tests/test_builtin_casters.cpp
3rdparty/pybind11/tests/test_call_policies.cpp
3rdparty/pybind11/tests/test_callbacks.cpp
3rdparty/pybind11/tests/test_chrono.cpp
3rdparty/pybind11/tests/test_class.cpp
3rdparty/pybind11/tests/test_constants_and_functions.cpp
3rdparty/pybind11/tests/test_copy_move.cpp
3rdparty/pybind11/tests/test_docstring_options.cpp
3rdparty/pybind11/tests/test_eigen.cpp
3rdparty/pybind11/tests/test_enum.cpp
3rdparty/pybind11/tests/test_eval.cpp
3rdparty/pybind11/tests/test_exceptions.cpp
3rdparty/pybind11/tests/test_factory_constructors.cpp
3rdparty/pybind11/tests/test_gil_scoped.cpp
3rdparty/pybind11/tests/test_iostream.cpp
3rdparty/pybind11/tests/test_kwargs_and_defaults.cpp
3rdparty/pybind11/tests/test_local_bindings.cpp
3rdparty/pybind11/tests/test_methods_and_attributes.cpp
3rdparty/pybind11/tests/test_modules.cpp
3rdparty/pybind11/tests/test_multiple_inheritance.cpp
3rdparty/pybind11/tests/test_numpy_array.cpp
3rdparty/pybind11/tests/test_numpy_dtypes.cpp
3rdparty/pybind11/tests/test_numpy_vectorize.cpp
3rdparty/pybind11/tests/test_opaque_types.cpp
3rdparty/pybind11/tests/test_operator_overloading.cpp
3rdparty/pybind11/tests/test_pickling.cpp
3rdparty/pybind11/tests/test_pytypes.cpp
3rdparty/pybind11/tests/test_sequences_and_iterators.cpp
3rdparty/pybind11/tests/test_smart_ptr.cpp
3rdparty/pybind11/tests/test_stl.cpp
3rdparty/pybind11/tests/test_stl_binders.cpp
3rdparty/pybind11/tests/test_tagbased_polymorphic.cpp
3rdparty/pybind11/tests/test_union.cpp
3rdparty/pybind11/tests/test_virtual_functions.cpp
3rdparty/pybind11/tests/test_cmake_build/CMakeLists.txt
3rdparty/pybind11/tests/test_cmake_build/embed.cpp
3rdparty/pybind11/tests/test_cmake_build/main.cpp
3rdparty/pybind11/tests/test_cmake_build/installed_embed/CMakeLists.txt
3rdparty/pybind11/tests/test_cmake_build/installed_function/CMakeLists.txt
3rdparty/pybind11/tests/test_cmake_build/installed_target/CMakeLists.txt
3rdparty/pybind11/tests/test_cmake_build/subdirectory_embed/CMakeLists.txt
3rdparty/pybind11/tests/test_cmake_build/subdirectory_function/CMakeLists.txt
3rdparty/pybind11/tests/test_cmake_build/subdirectory_target/CMakeLists.txt
3rdparty/pybind11/tests/test_embed/CMakeLists.txt
3rdparty/pybind11/tests/test_embed/catch.cpp
3rdparty/pybind11/tests/test_embed/external_module.cpp
3rdparty/pybind11/tests/test_embed/test_interpreter.cpp
3rdparty/pybind11/tools/FindCatch.cmake
3rdparty/pybind11/tools/FindEigen3.cmake
3rdparty/pybind11/tools/FindPythonLibsNew.cmake
3rdparty/pybind11/tools/pybind11Tools.cmake
lightseq/__init__.py
lightseq.egg-info/PKG-INFO
lightseq.egg-info/SOURCES.txt
lightseq.egg-info/dependency_links.txt
lightseq.egg-info/entry_points.txt
lightseq.egg-info/not-zip-safe
lightseq.egg-info/requires.txt
lightseq.egg-info/top_level.txt
lightseq/csrc/example/CMakeLists.txt
lightseq/csrc/example/bert_example.cc
lightseq/csrc/kernels/CMakeLists.txt
lightseq/csrc/kernels/crf.cu
lightseq/csrc/kernels/cross_entropy.cu
lightseq/csrc/kernels/cublas_algo_map.cpp
lightseq/csrc/kernels/cublas_wrappers.cpp
lightseq/csrc/kernels/cublas_wrappers.cu
lightseq/csrc/kernels/cuda_util.cu
lightseq/csrc/kernels/dropout_kernels.cu
lightseq/csrc/kernels/embKernels.cc.cu
lightseq/csrc/kernels/embedding_kernels.cu
lightseq/csrc/kernels/fused_adam_kernel.cu
lightseq/csrc/kernels/gemm_test.cpp
lightseq/csrc/kernels/general_kernels.cu
lightseq/csrc/kernels/normalize_kernels.cu
lightseq/csrc/kernels/quantize_kernels.cu
lightseq/csrc/kernels/softmax_kernels.cu
lightseq/csrc/kernels/softmax_kernels_new.cu
lightseq/csrc/kernels/transform_kernels.cu
lightseq/csrc/kernels/transform_kernels_new.cu
lightseq/csrc/kernels/includes/block_reduce.h
lightseq/csrc/kernels/includes/common.h
lightseq/csrc/kernels/includes/cublas_algo_map.h
lightseq/csrc/kernels/includes/cublas_wrappers.h
lightseq/csrc/kernels/includes/cuda_util.h
lightseq/csrc/kernels/includes/embKernels.h
lightseq/csrc/kernels/includes/fused_adam_kernel.h
lightseq/csrc/kernels/includes/kernels.h
lightseq/csrc/kernels/includes/ls_cub.cuh
lightseq/csrc/kernels/includes/multi_tensor_apply.cuh
lightseq/csrc/layers/cross_entropy_layer.cpp
lightseq/csrc/layers/quant_linear_layer.cpp
lightseq/csrc/layers/transformer_decoder_layer.cpp
lightseq/csrc/layers/transformer_embedding_layer.cpp
lightseq/csrc/layers/transformer_encoder_layer.cpp
lightseq/csrc/layers/includes/cross_entropy_layer.h
lightseq/csrc/layers/includes/quant_linear_layer.h
lightseq/csrc/layers/includes/transformer_decoder_layer.h
lightseq/csrc/layers/includes/transformer_embedding_layer.h
lightseq/csrc/layers/includes/transformer_encoder_layer.h
lightseq/csrc/layers_new/CMakeLists.txt
lightseq/csrc/layers_new/crf_layer.cpp
lightseq/csrc/layers_new/dec_enc_attention_layer.cpp
lightseq/csrc/layers_new/dec_self_attention_layer.cpp
lightseq/csrc/layers_new/encdec_kv_layer.cpp
lightseq/csrc/layers_new/feed_forward_layer.cpp
lightseq/csrc/layers_new/linear_layer.cpp
lightseq/csrc/layers_new/multihead_attention_layer.cpp
lightseq/csrc/layers_new/transformer_decoder_layer.cpp
lightseq/csrc/layers_new/transformer_encoder_layer.cpp
lightseq/csrc/layers_new/includes/crf_layer.h
lightseq/csrc/layers_new/includes/dec_enc_attention_layer.h
lightseq/csrc/layers_new/includes/dec_self_attention_layer.h
lightseq/csrc/layers_new/includes/encdec_kv_layer.h
lightseq/csrc/layers_new/includes/feed_forward_layer.h
lightseq/csrc/layers_new/includes/launch_enc_emb_layer.h
lightseq/csrc/layers_new/includes/linear_layer.h
lightseq/csrc/layers_new/includes/lyr_normalize_layer.h
lightseq/csrc/layers_new/includes/multihead_attention_layer.h
lightseq/csrc/layers_new/includes/transformer_decoder_layer.h
lightseq/csrc/layers_new/includes/transformer_encoder_layer.h
lightseq/csrc/lsflow/CMakeLists.txt
lightseq/csrc/lsflow/context.cpp
lightseq/csrc/lsflow/layer.cpp
lightseq/csrc/lsflow/manager.cpp
lightseq/csrc/lsflow/node.cpp
lightseq/csrc/lsflow/tensor.cpp
lightseq/csrc/lsflow/includes/context.h
lightseq/csrc/lsflow/includes/declaration.h
lightseq/csrc/lsflow/includes/layer.h
lightseq/csrc/lsflow/includes/manager.h
lightseq/csrc/lsflow/includes/node.h
lightseq/csrc/lsflow/includes/tensor.h
lightseq/csrc/models/CMakeLists.txt
lightseq/csrc/models/bert.cc
lightseq/csrc/models/bert_crf.cc
lightseq/csrc/models/includes/bert.h
lightseq/csrc/models/includes/bert_crf.h
lightseq/csrc/models/includes/model_base.h
lightseq/csrc/ops/context.cpp
lightseq/csrc/ops/dropout.cpp
lightseq/csrc/ops/feed_forward.cpp
lightseq/csrc/ops/normalize_layer.cpp
lightseq/csrc/ops/softmax.cpp
lightseq/csrc/ops/strided_batch_gemm.cpp
lightseq/csrc/ops/includes/context.h
lightseq/csrc/ops/includes/dropout.h
lightseq/csrc/ops/includes/feed_forward.h
lightseq/csrc/ops/includes/normalize_layer.h
lightseq/csrc/ops/includes/softmax.h
lightseq/csrc/ops/includes/strided_batch_gemm.h
lightseq/csrc/ops_new/CMakeLists.txt
lightseq/csrc/ops_new/bias_act_dropout.cpp
lightseq/csrc/ops_new/bias_add_transform_20314.cpp
lightseq/csrc/ops_new/bias_dropout_residual.cpp
lightseq/csrc/ops_new/crf.cpp
lightseq/csrc/ops_new/dropout.cpp
lightseq/csrc/ops_new/launch_concat3_dim1.cpp
lightseq/csrc/ops_new/launch_enc_emb.cpp
lightseq/csrc/ops_new/layer_normalize.cpp
lightseq/csrc/ops_new/linear.cpp
lightseq/csrc/ops_new/softmax.cpp
lightseq/csrc/ops_new/strided_batch_gemm.cpp
lightseq/csrc/ops_new/transform_0213.cpp
lightseq/csrc/ops_new/includes/bias_act_dropout.h
lightseq/csrc/ops_new/includes/bias_add_transform_20314.h
lightseq/csrc/ops_new/includes/bias_dropout_residual.h
lightseq/csrc/ops_new/includes/crf.h
lightseq/csrc/ops_new/includes/dropout.h
lightseq/csrc/ops_new/includes/launch_concat3_dim1.h
lightseq/csrc/ops_new/includes/launch_enc_emb.h
lightseq/csrc/ops_new/includes/layer_normalize.h
lightseq/csrc/ops_new/includes/linear.h
lightseq/csrc/ops_new/includes/softmax.h
lightseq/csrc/ops_new/includes/strided_batch_gemm.h
lightseq/csrc/ops_new/includes/transform_0213.h
lightseq/csrc/proto/CMakeLists.txt
lightseq/csrc/proto/bert.proto
lightseq/csrc/proto/bert_crf.proto
lightseq/csrc/proto/bert_crf_weight.cc
lightseq/csrc/proto/bert_weight.cc
lightseq/csrc/proto/includes/bert_crf_weight.h
lightseq/csrc/proto/includes/bert_weight.h
lightseq/csrc/pybind/CMakeLists.txt
lightseq/csrc/pybind/pybind_adam.cpp
lightseq/csrc/pybind/pybind_kernel.cpp
lightseq/csrc/pybind/pybind_layer.cpp
lightseq/csrc/pybind/pybind_layer_new.cpp
lightseq/csrc/pybind/pybind_model.cpp
lightseq/csrc/pybind/pybind_op.cpp
lightseq/csrc/tools/CMakeLists.txt
lightseq/csrc/tools/util.cc.cu
lightseq/csrc/tools/includes/util.h
lightseq/inference/kernels/CMakeLists.txt
lightseq/inference/kernels/common.h
lightseq/inference/kernels/embKernels.cc.cu
lightseq/inference/kernels/embKernels.h
lightseq/inference/kernels/embKernels_int8.cc.cu
lightseq/inference/kernels/embKernels_int8.h
lightseq/inference/kernels/gptKernels.cc.cu
lightseq/inference/kernels/gptKernels.h
lightseq/inference/kernels/gptKernels_int8.cc.cu
lightseq/inference/kernels/gptKernels_int8.h
lightseq/inference/kernels/moeKernels.cc.cu
lightseq/inference/kernels/moeKernels.h
lightseq/inference/kernels/multilgKernels.cc.cu
lightseq/inference/kernels/multilgKernels.h
lightseq/inference/kernels/t5EmbKernels.cc.cu
lightseq/inference/kernels/t5EmbKernels.h
lightseq/inference/kernels/t5Kernels.cc.cu
lightseq/inference/kernels/t5Kernels.h
lightseq/inference/kernels/transformerKernels.cc.cu
lightseq/inference/kernels/transformerKernels.h
lightseq/inference/kernels/transformerKernels_int8.cc.cu
lightseq/inference/kernels/transformerKernels_int8.h
lightseq/inference/model/CMakeLists.txt
lightseq/inference/model/bert_encoder.cc.cu
lightseq/inference/model/bert_encoder.h
lightseq/inference/model/cublas_algo_map.cc
lightseq/inference/model/cublas_algo_map.h
lightseq/inference/model/cublas_helper.cc
lightseq/inference/model/cublas_helper.h
lightseq/inference/model/decoder.cc.cu
lightseq/inference/model/decoder.h
lightseq/inference/model/encoder.cc.cu
lightseq/inference/model/encoder.h
lightseq/inference/model/gpt_encoder.cc.cu
lightseq/inference/model/gpt_encoder.h
lightseq/inference/model/moe_decoder.cc.cu
lightseq/inference/model/moe_decoder.h
lightseq/inference/model/moe_encoder.cc.cu
lightseq/inference/model/moe_encoder.h
lightseq/inference/model/mt5_decoder.cc.cu
lightseq/inference/model/mt5_decoder.h
lightseq/inference/model/mt5_encoder.cc.cu
lightseq/inference/model/mt5_encoder.h
lightseq/inference/model/quant_bert_encoder.cc.cu
lightseq/inference/model/quant_bert_encoder.h
lightseq/inference/model/quant_decoder.cc.cu
lightseq/inference/model/quant_decoder.h
lightseq/inference/model/quant_encoder.cc.cu
lightseq/inference/model/quant_encoder.h
lightseq/inference/model/quant_gpt_encoder.cc.cu
lightseq/inference/model/quant_gpt_encoder.h
lightseq/inference/model/quant_vit_encoder.cc.cu
lightseq/inference/model/quant_vit_encoder.h
lightseq/inference/model/t5_decoder.cc.cu
lightseq/inference/model/t5_decoder.h
lightseq/inference/model/t5_encoder.cc.cu
lightseq/inference/model/t5_encoder.h
lightseq/inference/model/vit_encoder.cc.cu
lightseq/inference/model/vit_encoder.h
lightseq/inference/proto/CMakeLists.txt
lightseq/inference/proto/bert.proto
lightseq/inference/proto/bert_weight.cc
lightseq/inference/proto/bert_weight.h
lightseq/inference/proto/gpt.proto
lightseq/inference/proto/gpt_weight.cc
lightseq/inference/proto/gpt_weight.h
lightseq/inference/proto/moe.proto
lightseq/inference/proto/moe_weight.cc
lightseq/inference/proto/moe_weight.h
lightseq/inference/proto/mt5.proto
lightseq/inference/proto/mt5_weight.cc
lightseq/inference/proto/mt5_weight.h
lightseq/inference/proto/quant_bert.proto
lightseq/inference/proto/quant_bert_weight.cc
lightseq/inference/proto/quant_bert_weight.h
lightseq/inference/proto/quant_gpt.proto
lightseq/inference/proto/quant_gpt_weight.cc
lightseq/inference/proto/quant_gpt_weight.h
lightseq/inference/proto/quant_transformer.proto
lightseq/inference/proto/quant_transformer_weight.cc
lightseq/inference/proto/quant_transformer_weight.h
lightseq/inference/proto/quant_vit.proto
lightseq/inference/proto/quant_vit_weight.cc
lightseq/inference/proto/quant_vit_weight.h
lightseq/inference/proto/t5.proto
lightseq/inference/proto/t5_weight.cc
lightseq/inference/proto/t5_weight.h
lightseq/inference/proto/transformer.proto
lightseq/inference/proto/transformer_weight.cc
lightseq/inference/proto/transformer_weight.h
lightseq/inference/proto/vit.proto
lightseq/inference/proto/vit_weight.cc
lightseq/inference/proto/vit_weight.h
lightseq/inference/pywrapper/CMakeLists.txt
lightseq/inference/pywrapper/bert.cc
lightseq/inference/pywrapper/bert.h
lightseq/inference/pywrapper/gpt.cc
lightseq/inference/pywrapper/gpt.h
lightseq/inference/pywrapper/model_base.h
lightseq/inference/pywrapper/moe.cc
lightseq/inference/pywrapper/moe.h
lightseq/inference/pywrapper/mt5.cc
lightseq/inference/pywrapper/mt5.h
lightseq/inference/pywrapper/quant_bert.cc
lightseq/inference/pywrapper/quant_bert.h
lightseq/inference/pywrapper/quant_gpt.cc
lightseq/inference/pywrapper/quant_gpt.h
lightseq/inference/pywrapper/quant_transformer.cc
lightseq/inference/pywrapper/quant_transformer.h
lightseq/inference/pywrapper/quant_vit.cc
lightseq/inference/pywrapper/quant_vit.h
lightseq/inference/pywrapper/t5.cc
lightseq/inference/pywrapper/t5.h
lightseq/inference/pywrapper/transformer.cc
lightseq/inference/pywrapper/transformer.h
lightseq/inference/pywrapper/transformer_decoder.cc.cu
lightseq/inference/pywrapper/vit.cc
lightseq/inference/pywrapper/vit.h
lightseq/inference/pywrapper/wrapper.cc
lightseq/inference/server/CMakeLists.txt
lightseq/inference/server/custom.h
lightseq/inference/server/decoder_generate_server.cc.cu
lightseq/inference/server/generate_server.cc.cu
lightseq/inference/server/gpt_generate_server.cc.cu
lightseq/inference/server/gptlm_server.cc.cu
lightseq/inference/server/libserver.ldscript
lightseq/inference/server/model_config.h
lightseq/inference/server/model_config.proto
lightseq/inference/server/model_config_cuda.h
lightseq/inference/server/moe_server.cc.cu
lightseq/inference/server/transformer_server.cc.cu
lightseq/inference/tools/CMakeLists.txt
lightseq/inference/tools/util.cc.cu
lightseq/inference/tools/util.h
lightseq/inference/triton_backend/CMakeLists.txt
lightseq/inference/triton_backend/src/libtriton_minimal.ldscript
lightseq/inference/triton_backend/src/lightseq_backend.cc
lightseq/inference/triton_backend/src/triton_model.h
lightseq/inference/triton_backend/src/triton_utils.h
lightseq/training/__init__.py
lightseq/training/cli/__init__.py
lightseq/training/cli/lightseq_deepspeed_cli.py
lightseq/training/cli/lightseq_fairseq_generate_cli.py
lightseq/training/cli/lightseq_fairseq_train_cli.py
lightseq/training/cli/lightseq_fairseq_validate_cli.py
lightseq/training/cli/lightseq_infer_cli.py
lightseq/training/cli/fs_modules/__init__.py
lightseq/training/cli/fs_modules/ls_adam.py
lightseq/training/cli/fs_modules/ls_bart.py
lightseq/training/cli/fs_modules/ls_fs_transformer_decoder_layer.py
lightseq/training/cli/fs_modules/ls_label_smoothed_cross_entropy.py
lightseq/training/cli/fs_modules/ls_transformer.py
lightseq/training/cli/fs_modules/ls_translation.py
lightseq/training/csrc/ops/includes/strided_batch_gemm.h
lightseq/training/gcq/__init__.py
lightseq/training/gcq/gcq.py
lightseq/training/gcq/ls_fs_gcq_train.py
lightseq/training/gcq/ls_fs_gcq_trainer.py
lightseq/training/ops/__init__.py
lightseq/training/ops/pytorch/__init__.py
lightseq/training/ops/pytorch/adam.py
lightseq/training/ops/pytorch/cross_entropy_layer.py
lightseq/training/ops/pytorch/export.py
lightseq/training/ops/pytorch/export_quant.py
lightseq/training/ops/pytorch/gemm_test.py
lightseq/training/ops/pytorch/gpt_layer.py
lightseq/training/ops/pytorch/layer_base.py
lightseq/training/ops/pytorch/quant_linear_layer.py
lightseq/training/ops/pytorch/quantization.py
lightseq/training/ops/pytorch/torch_transformer_layers.py
lightseq/training/ops/pytorch/transformer.py
lightseq/training/ops/pytorch/transformer_decoder_layer.py
lightseq/training/ops/pytorch/transformer_decoder_layer_new.py
lightseq/training/ops/pytorch/transformer_embedding_layer.py
lightseq/training/ops/pytorch/transformer_encoder_layer.py
lightseq/training/ops/pytorch/transformer_encoder_layer_new.py
lightseq/training/ops/pytorch/util.py
lightseq/training/ops/pytorch/builder/__init__.py
lightseq/training/ops/pytorch/builder/adam_builder.py
lightseq/training/ops/pytorch/builder/builder.py
lightseq/training/ops/pytorch/builder/kernel_builder.py
lightseq/training/ops/pytorch/builder/layer_builder.py
lightseq/training/ops/pytorch/builder/operator_builder.py
lightseq/training/ops/pytorch/builder/transformer_builder.py
lightseq/training/ops/tensorflow/__init__.py
lightseq/training/pytorch_quantization/__init__.py
lightseq/training/pytorch_quantization/quant_modules.py
lightseq/training/pytorch_quantization/tensor_quant.py
lightseq/training/pytorch_quantization/version.py
lightseq/training/pytorch_quantization/calib/__init__.py
lightseq/training/pytorch_quantization/calib/calibrator.py
lightseq/training/pytorch_quantization/calib/histogram.py
lightseq/training/pytorch_quantization/calib/max.py
lightseq/training/pytorch_quantization/nn/__init__.py
lightseq/training/pytorch_quantization/nn/functional.py
lightseq/training/pytorch_quantization/nn/_functions/__init__.py
lightseq/training/pytorch_quantization/nn/_functions/quant_rnn.py
lightseq/training/pytorch_quantization/nn/modules/__init__.py
lightseq/training/pytorch_quantization/nn/modules/_utils.py
lightseq/training/pytorch_quantization/nn/modules/clip.py
lightseq/training/pytorch_quantization/nn/modules/quant_bert.py
lightseq/training/pytorch_quantization/nn/modules/quant_conv.py
lightseq/training/pytorch_quantization/nn/modules/quant_instancenorm.py
lightseq/training/pytorch_quantization/nn/modules/quant_linear.py
lightseq/training/pytorch_quantization/nn/modules/quant_pooling.py
lightseq/training/pytorch_quantization/nn/modules/quant_rnn.py
lightseq/training/pytorch_quantization/nn/modules/tensor_quantizer.py
lightseq/training/pytorch_quantization/optim/__init__.py
lightseq/training/pytorch_quantization/optim/helper.py
lightseq/training/pytorch_quantization/utils/__init__.py
lightseq/training/pytorch_quantization/utils/quant_logging.py
lightseq/training/pytorch_quantization/utils/reduce_amax.py