This is an automated email from the ASF dual-hosted git repository.
github-actions[bot] pushed a change to branch nightly
in repository https://gitbox.apache.org/repos/asf/tvm.git
from dcbebe7bfd [Relax][Frontend][TFLite] Add UNIDIRECTIONAL_SEQUENCE_RNN converter (#19601)
add de89da6b18 [IR] Rename Call annotations to attrs (#19618)
add f0ac8d62ef [REFACTOR][RUNTIME] Phase out tvm::runtime::regex_match (#19620)
add 6c27733258 [REFACTOR][RUNTIME] Remove leftover microTVM/CRT crumbs (#19622)
add 66a4bcd401 [REFACTOR][RUNTIME] Relocate nvtx.h to tvm/support/cuda and make it header-only (#19621)
add ffea531107 [REFACTOR][PYTHON] Lift compiler/CLI/process modules from tvm.contrib to tvm.support (#19624)
add 2f4f4b1de3 [REFACTOR][IR][FFI] Bump tvm-ffi (+ SEqHashDef migration) and phase out tvm/ir/repr.h (#19627)
add 4bcf694cbf [REFACTOR][IR] Inline ReplaceGlobalVars into AttachGlobalSymbol (#19625)
add 7c21470a38 [BugFix][Vulkan][CodeGen] Change OpControlBarrier to AcquireRelease (#19619)
add 23db01f1fa [REFACTOR][RUNTIME] Structural reorganization: locality moves for thread_map, texture, minrpc, disco, contrib (#19628)
add 61ae85b9d1 [REFACTOR][PYTHON] Consolidate derived_object into tvm.ir.utils (#19630)
No new revisions were added by this update.
Summary of changes:
3rdparty/tvm-ffi | 2 +-
CMakeLists.txt | 20 +-
apps/android_rpc/app/src/main/jni/tvm_runtime.h | 6 +-
apps/android_rpc/tests/android_rpc_test.py | 2 +-
apps/ios_rpc/tests/ios_rpc_test.py | 2 +-
cmake/modules/CUDA.cmake | 12 +-
cmake/modules/Hexagon.cmake | 4 +-
cmake/modules/ROCM.cmake | 6 +-
cmake/modules/contrib/AMX.cmake | 2 +-
cmake/modules/contrib/BLAS.cmake | 8 +-
cmake/modules/contrib/CLML.cmake | 4 +-
cmake/modules/contrib/CUTLASS.cmake | 16 +-
cmake/modules/contrib/CoreML.cmake | 2 +-
cmake/modules/contrib/DNNL.cmake | 22 +-
cmake/modules/contrib/ExampleNPU.cmake | 4 +-
cmake/modules/contrib/NNAPI.cmake | 4 +-
cmake/modules/contrib/Random.cmake | 2 +-
cmake/modules/contrib/Sort.cmake | 2 +-
cmake/modules/contrib/TensorRT.cmake | 4 +-
cmake/modules/contrib/vllm.cmake | 4 +-
cmake/utils/CRTConfig.cmake | 35 --
docs/conf.py | 3 +-
docs/how_to/tutorials/cross_compilation_and_rpc.py | 2 +-
docs/reference/api/python/contrib.rst | 66 ---
docs/reference/api/python/support.rst | 50 ++
include/tvm/ir/expr.h | 2 +-
include/tvm/ir/replace_global_vars.h | 57 --
include/tvm/ir/repr.h | 72 ---
include/tvm/relax/exec_builder.h | 2 +-
include/tvm/relax/expr.h | 9 +-
include/tvm/relax/struct_info.h | 2 +-
include/tvm/{runtime => support/cuda}/nvtx.h | 48 +-
include/tvm/tirx/buffer.h | 15 +-
include/tvm/tirx/exec_scope.h | 2 +-
include/tvm/tirx/expr.h | 23 +-
include/tvm/tirx/function.h | 2 +-
include/tvm/tirx/index_map.h | 2 +-
include/tvm/tirx/predicate.h | 2 +-
include/tvm/tirx/stmt.h | 10 +-
include/tvm/tirx/var.h | 2 +-
python/tvm/__init__.py | 4 +-
python/tvm/contrib/cutlass/build.py | 2 +-
python/tvm/contrib/hexagon/hexagon_profiler.py | 2 +-
python/tvm/contrib/hexagon/meta_schedule.py | 5 +-
python/tvm/contrib/hexagon/session.py | 2 +-
python/tvm/contrib/hexagon/tools.py | 2 +-
python/tvm/contrib/rpc.py | 28 -
python/tvm/contrib/spirv.py | 59 --
python/tvm/contrib/tvmjs.py | 3 +-
python/tvm/exec/popen_worker.py | 2 +-
python/tvm/ir/attrs.py | 10 +
python/tvm/ir/module.py | 27 -
python/tvm/{runtime/support.py => ir/utils.py} | 54 +-
python/tvm/relax/backend/cuda/flashinfer.py | 2 +-
python/tvm/relax/backend/metal/coreml.py | 2 +-
python/tvm/relax/expr_functor.py | 2 +-
python/tvm/relax/frontend/nn/extern.py | 2 +-
python/tvm/rpc/client.py | 2 +-
python/tvm/rpc/minrpc.py | 4 +-
python/tvm/rpc/proxy.py | 2 +-
python/tvm/rpc/server.py | 10 +-
python/tvm/rpc/tracker.py | 2 +-
python/tvm/runtime/__init__.py | 1 -
python/tvm/runtime/executable.py | 2 +-
python/tvm/runtime/module.py | 14 +-
python/tvm/s_tir/meta_schedule/__init__.py | 1 -
.../s_tir/meta_schedule/builder/local_builder.py | 7 +-
.../s_tir/meta_schedule/cost_model/mlp_model.py | 5 +-
.../s_tir/meta_schedule/cost_model/random_model.py | 3 +-
.../s_tir/meta_schedule/cost_model/xgb_model.py | 6 +-
.../feature_extractor/random_feature_extractor.py | 2 +-
.../tvm/s_tir/meta_schedule/runner/local_runner.py | 5 +-
.../tvm/s_tir/meta_schedule/runner/rpc_runner.py | 4 +-
.../meta_schedule/testing/custom_builder_runner.py | 2 +-
.../s_tir/meta_schedule/testing/dummy_object.py | 2 +-
python/tvm/s_tir/meta_schedule/utils.py | 140 -----
python/tvm/support.py | 102 ----
python/tvm/support/__init__.py | 54 ++
python/tvm/{contrib => support}/cc.py | 2 +-
python/tvm/{contrib => support}/clang.py | 0
python/tvm/{contrib => support}/emcc.py | 0
python/tvm/support/libinfo.py | 45 ++
python/tvm/{contrib => support}/ndk.py | 0
python/tvm/{contrib => support}/nvcc.py | 0
python/tvm/{contrib => support}/popen_pool.py | 0
python/tvm/{contrib => support}/rocm.py | 0
python/tvm/{contrib => support}/tar.py | 2 +-
python/tvm/{contrib => support}/utils.py | 0
python/tvm/{contrib => support}/xcode.py | 0
python/tvm/testing/runner.py | 2 +-
python/tvm/testing/utils.py | 13 +-
python/tvm/tirx/bench.py | 2 +-
python/tvm/tirx/expr.py | 14 +-
python/tvm/tirx/expr_functor.py | 2 +-
python/tvm/tirx/functor.py | 35 +-
python/tvm/tirx/op.py | 12 +-
python/tvm/tirx/operator/intrinsics/cuda/header.py | 2 +-
python/tvm/tirx/script/builder/external_kernel.py | 2 +-
src/arith/ir_mutator_with_analyzer.cc | 2 +-
src/arith/rewrite_simplify.cc | 4 +-
src/ir/{repr.cc => access_path_repr.cc} | 19 +-
src/ir/instrument.cc | 2 +-
src/ir/replace_global_vars.cc | 110 ----
src/ir/transform.cc | 2 +-
.../backend/contrib/codegen_json/codegen_json.h | 4 +-
src/relax/ir/dataflow_pattern.cc | 1 -
src/relax/ir/transform.cc | 2 +-
src/relax/transform/attach_global_symbol.cc | 106 +++-
src/relax/transform/replace_global_vars.cc | 83 ---
src/relax/transform/static_plan_block_memory.cc | 2 +-
src/relax/transform/update_param_struct_info.cc | 1 -
src/runtime/crt/common/crt_runtime_api.c | 659 ---------------------
src/runtime/{ => extra}/contrib/amx/amx_config.cc | 0
src/runtime/{ => extra}/contrib/cblas/cblas.cc | 0
src/runtime/{ => extra}/contrib/cblas/dnnl_blas.cc | 0
.../{ => extra}/contrib/cblas/gemm_common.h | 0
src/runtime/{ => extra}/contrib/cblas/mkl.cc | 0
.../contrib/clml/clml_memory_planner.cc | 0
.../{ => extra}/contrib/clml/clml_memory_planner.h | 0
.../{ => extra}/contrib/clml/clml_runtime.cc | 2 +-
.../{ => extra}/contrib/clml/clml_runtime.h | 6 +-
src/runtime/{ => extra}/contrib/clml/clml_utils.cc | 0
src/runtime/{ => extra}/contrib/clml/clml_utils.h | 0
.../{ => extra}/contrib/coreml/coreml_runtime.h | 0
.../{ => extra}/contrib/coreml/coreml_runtime.mm | 2 +-
src/runtime/{ => extra}/contrib/cublas/cublas.cc | 2 +-
.../contrib/cublas/cublas_json_runtime.cc | 2 +-
.../{ => extra}/contrib/cublas/cublas_utils.cc | 2 +-
.../{ => extra}/contrib/cublas/cublas_utils.h | 0
.../{ => extra}/contrib/cudnn/conv_backward.cc | 0
.../{ => extra}/contrib/cudnn/conv_forward.cc | 0
.../contrib/cudnn/cudnn_frontend/attention.cc | 2 +-
.../contrib/cudnn/cudnn_frontend/attention.h | 0
.../contrib/cudnn/cudnn_json_runtime.cc | 0
.../{ => extra}/contrib/cudnn/cudnn_utils.cc | 0
.../{ => extra}/contrib/cudnn/cudnn_utils.h | 2 +-
src/runtime/{ => extra}/contrib/cudnn/softmax.cc | 0
src/runtime/{ => extra}/contrib/curand/curand.cc | 2 +-
.../contrib/curand/helper_cuda_kernels.cu | 0
.../contrib/curand/helper_cuda_kernels.h | 0
.../contrib/cutlass/fp16_group_gemm.cuh | 0
.../cutlass/fp16_group_gemm_runner_sm100.cuh | 2 +-
.../cutlass/fp16_group_gemm_runner_sm90.cuh | 2 +-
.../contrib/cutlass/fp16_group_gemm_sm100.cu | 0
.../contrib/cutlass/fp16_group_gemm_sm90.cu | 0
.../{ => extra}/contrib/cutlass/fp8_gemm.cu | 0
.../contrib/cutlass/fp8_group_gemm_sm90.cu | 0
.../contrib/cutlass/fp8_groupwise_scaled_gemm.cuh | 0
.../fp8_groupwise_scaled_gemm_runner_sm100.cuh | 2 +-
.../fp8_groupwise_scaled_gemm_runner_sm90.cuh | 2 +-
.../cutlass/fp8_groupwise_scaled_gemm_sm100.cu | 0
.../cutlass/fp8_groupwise_scaled_gemm_sm90.cu | 0
...p8_groupwise_scaled_group_gemm_runner_sm100.cuh | 2 +-
.../fp8_groupwise_scaled_group_gemm_sm100.cu | 0
.../{ => extra}/contrib/cutlass/gemm_runner.cuh | 2 +-
.../contrib/cutlass/weight_preprocess.cc | 0
src/runtime/{ => extra}/contrib/dnnl/dnnl.cc | 0
.../{ => extra}/contrib/dnnl/dnnl_json_runtime.cc | 60 +-
src/runtime/{ => extra}/contrib/dnnl/dnnl_kernel.h | 0
.../contrib/dnnl/dnnl_tensor_requisite.h | 0
src/runtime/{ => extra}/contrib/dnnl/dnnl_utils.cc | 0
src/runtime/{ => extra}/contrib/dnnl/dnnl_utils.h | 0
.../contrib/example_npu/example_npu_runtime.cc | 0
src/runtime/{ => extra}/contrib/hipblas/hipblas.cc | 2 +-
.../contrib/hipblas/hipblas_json_runtime.cc | 2 +-
.../{ => extra}/contrib/hipblas/hipblas_utils.cc | 2 +-
.../{ => extra}/contrib/hipblas/hipblas_utils.h | 0
src/runtime/{ => extra}/contrib/json/json_node.h | 0
.../{ => extra}/contrib/json/json_runtime.h | 2 +-
.../{ => extra}/contrib/nnapi/nnapi_builder.cc | 0
.../{ => extra}/contrib/nnapi/nnapi_builder.h | 0
src/runtime/{ => extra}/contrib/nnapi/nnapi_ops.cc | 0
src/runtime/{ => extra}/contrib/nnapi/nnapi_ops.h | 0
.../{ => extra}/contrib/nnapi/nnapi_runtime.cc | 0
.../{ => extra}/contrib/nvshmem/dist_gemm.cu | 2 +-
src/runtime/{ => extra}/contrib/nvshmem/init.cc | 2 +-
.../{ => extra}/contrib/nvshmem/kv_transfer.cu | 0
.../contrib/nvshmem/memory_allocator.cc | 4 +-
.../{ => extra}/contrib/random/mt_random_engine.cc | 0
src/runtime/{ => extra}/contrib/random/random.cc | 0
src/runtime/{ => extra}/contrib/sort/sort.cc | 2 +-
.../contrib/tensorrt/tensorrt_builder.cc | 0
.../contrib/tensorrt/tensorrt_builder.h | 0
.../contrib/tensorrt/tensorrt_calibrator.h | 2 +-
.../{ => extra}/contrib/tensorrt/tensorrt_logger.h | 0
.../{ => extra}/contrib/tensorrt/tensorrt_ops.cc | 0
.../{ => extra}/contrib/tensorrt/tensorrt_ops.h | 0
.../contrib/tensorrt/tensorrt_runtime.cc | 4 +-
.../{ => extra}/contrib/tensorrt/tensorrt_utils.h | 0
src/runtime/{ => extra}/contrib/thrust/thrust.cu | 2 +-
.../{ => extra}/contrib/vllm/attention_kernels.cu | 0
.../{ => extra}/contrib/vllm/attention_utils.cuh | 0
.../{ => extra}/contrib/vllm/cache_alloc.cc | 0
.../{ => extra}/contrib/vllm/cache_kernels.cu | 0
.../{ => extra}/contrib/vllm/dtype_float16.h | 0
src/runtime/{ => extra}/disco/bcast_session.cc | 0
src/runtime/{ => extra}/disco/bcast_session.h | 0
src/runtime/{ => extra}/disco/builtin.cc | 0
.../{ => extra}/disco/cuda_ipc/cuda_ipc_memory.cc | 6 +-
.../{ => extra}/disco/cuda_ipc/custom_allreduce.cc | 2 +-
src/runtime/{ => extra}/disco/disco_worker.cc | 2 +-
.../{ => extra}/disco/disco_worker_thread.h | 0
.../disco/distributed/socket_session.cc | 2 +-
src/runtime/{ => extra}/disco/loader.cc | 2 +-
src/runtime/{ => extra}/disco/message_queue.h | 0
src/runtime/{ => extra}/disco/nccl/nccl.cc | 2 +-
src/runtime/{ => extra}/disco/nccl/nccl_context.h | 6 +-
src/runtime/{ => extra}/disco/process_session.cc | 4 +-
src/runtime/{ => extra}/disco/protocol.h | 8 +-
src/runtime/{ => extra}/disco/session.cc | 0
src/runtime/{ => extra}/disco/threaded_session.cc | 4 +-
src/runtime/{ => extra}/disco/utils.h | 0
src/runtime/hexagon/rpc/hexagon/rpc_server.cc | 2 +-
src/runtime/hexagon/rpc/simulator/rpc_server.cc | 2 +-
src/runtime/meta_data.h | 79 ---
src/runtime/nvtx.cc | 42 --
src/runtime/opencl/opencl_common.h | 2 +-
src/runtime/{ => opencl}/texture.h | 6 +-
src/runtime/regex.cc | 43 --
src/runtime/regex.h | 67 ---
src/runtime/{ => rpc}/minrpc/minrpc_server.h | 0
.../posix_popen_server/posix_popen_server.cc | 0
src/runtime/{ => rpc}/minrpc/rpc_reference.h | 0
src/runtime/rpc/rpc_endpoint.h | 2 +-
src/runtime/rpc/rpc_session.h | 2 +-
src/runtime/vm/attn_utils.h | 2 +-
src/runtime/vm/paged_kv_cache.cc | 4 +-
src/runtime/vm/vm.cc | 4 +-
src/runtime/{ => vulkan}/thread_map.h | 6 +-
src/runtime/vulkan/vulkan_device.h | 2 +-
src/runtime/vulkan/vulkan_device_api.h | 2 +-
src/s_tir/backend/adreno/inject_texture_alloc.cc | 2 +-
src/s_tir/backend/adreno/texture_flatten.cc | 2 +-
src/s_tir/transform/inject_software_pipeline.cc | 6 +-
src/script/printer/script_printer.cc | 1 -
src/target/opencl/codegen_opencl.cc | 2 +-
src/target/vulkan/codegen_spirv.cc | 2 +-
src/tirx/analysis/deep_equal.cc | 4 +-
src/tirx/ir/data_type_rewriter.cc | 5 +-
src/tirx/ir/expr.cc | 18 +-
src/tirx/ir/expr_functor.cc | 2 +-
src/tirx/ir/transform.cc | 2 +-
src/tirx/script/printer/expr.cc | 4 +-
src/tirx/transform/lower_warp_memory.cc | 2 +-
src/tirx/transform/replace_global_vars.cc | 84 ---
src/tirx/transform/storage_rewrite.cc | 2 +-
src/tirx/transform/tile_primitive_dispatch.cc | 2 +-
src/tirx/transform/unsupported_dtype_legalize.cc | 5 +-
src/tirx/transform/vectorize_loop.cc | 18 +-
.../test_minimal_target_codegen_llvm.py | 2 +-
tests/python/codegen/test_gpu_codegen_allreduce.py | 2 +-
tests/python/codegen/test_inject_ptx_ldg32.py | 4 +-
tests/python/codegen/test_target_codegen_blob.py | 2 +-
tests/python/codegen/test_target_codegen_c_host.py | 2 +-
.../codegen/test_target_codegen_cross_llvm.py | 2 +-
tests/python/codegen/test_target_codegen_cuda.py | 10 +-
.../codegen/test_target_codegen_cuda_fastmath.py | 2 +-
tests/python/codegen/test_target_codegen_llvm.py | 2 +-
tests/python/codegen/test_target_codegen_metal.py | 2 +-
tests/python/contrib/test_ccache.py | 2 +-
tests/python/contrib/test_coreml_runtime.py | 3 +-
tests/python/contrib/test_popen_pool.py | 2 +-
tests/python/contrib/test_util.py | 2 +-
.../python/ir/test_transform_replace_global_var.py | 308 ----------
tests/python/nightly/test_nnapi/infrastructure.py | 2 +-
tests/python/relax/backend/adreno/utils.py | 2 +-
tests/python/relax/test_codegen_coreml.py | 4 +-
tests/python/relax/test_runtime_builtin.py | 3 +-
.../relax/test_runtime_sampling_flashinfer.py | 2 +-
tests/python/relax/test_transform_codegen_pass.py | 2 +-
tests/python/relax/test_vm_build.py | 2 +-
tests/python/relax/test_vm_codegen_only.py | 2 +-
tests/python/relax/texture/test_texture_nd.py | 2 +-
tests/python/runtime/test_runtime_measure.py | 2 +-
tests/python/runtime/test_runtime_module_export.py | 2 +-
tests/python/runtime/test_runtime_module_load.py | 2 +-
tests/python/runtime/test_runtime_rpc.py | 2 +-
.../meta_schedule/test_meta_schedule_cost_model.py | 2 +-
.../meta_schedule/test_meta_schedule_database.py | 5 +-
.../test_meta_schedule_feature_extractor.py | 2 +-
.../test_meta_schedule_measure_callback.py | 15 +-
.../test_meta_schedule_post_order_apply.py | 2 +-
.../meta_schedule/test_meta_schedule_runner.py | 2 +-
.../test_meta_schedule_search_strategy.py | 2 +-
.../test_meta_schedule_space_generator.py | 2 +-
.../test_meta_schedule_task_scheduler.py | 7 +-
.../meta_schedule/test_meta_schedule_tune_tir.py | 3 +-
.../test_s_tir_transform_inject_ptx_async_copy.py | 4 +-
tests/python/target/test_arm_target.py | 2 +-
tests/python/tirx-base/test_tir_constructor.py | 40 +-
tests/python/tirx-base/test_tir_intrin.py | 2 +-
tests/python/tirx/codegen/test_codegen_nvshmem.py | 2 +-
web/emcc/wasm_runtime.cc | 3 +-
web/tests/python/relax_rpc_test.py | 3 +-
web/tests/python/webgpu_rpc_test.py | 3 +-
295 files changed, 729 insertions(+), 2578 deletions(-)
delete mode 100644 cmake/utils/CRTConfig.cmake
delete mode 100644 include/tvm/ir/replace_global_vars.h
delete mode 100644 include/tvm/ir/repr.h
rename include/tvm/{runtime => support/cuda}/nvtx.h (56%)
delete mode 100644 python/tvm/contrib/rpc.py
delete mode 100644 python/tvm/contrib/spirv.py
rename python/tvm/{runtime/support.py => ir/utils.py} (77%)
delete mode 100644 python/tvm/support.py
create mode 100644 python/tvm/support/__init__.py
rename python/tvm/{contrib => support}/cc.py (99%)
rename python/tvm/{contrib => support}/clang.py (100%)
rename python/tvm/{contrib => support}/emcc.py (100%)
create mode 100644 python/tvm/support/libinfo.py
rename python/tvm/{contrib => support}/ndk.py (100%)
rename python/tvm/{contrib => support}/nvcc.py (100%)
rename python/tvm/{contrib => support}/popen_pool.py (100%)
rename python/tvm/{contrib => support}/rocm.py (100%)
rename python/tvm/{contrib => support}/tar.py (98%)
rename python/tvm/{contrib => support}/utils.py (100%)
rename python/tvm/{contrib => support}/xcode.py (100%)
rename src/ir/{repr.cc => access_path_repr.cc} (87%)
delete mode 100644 src/ir/replace_global_vars.cc
delete mode 100644 src/relax/transform/replace_global_vars.cc
delete mode 100644 src/runtime/crt/common/crt_runtime_api.c
rename src/runtime/{ => extra}/contrib/amx/amx_config.cc (100%)
rename src/runtime/{ => extra}/contrib/cblas/cblas.cc (100%)
rename src/runtime/{ => extra}/contrib/cblas/dnnl_blas.cc (100%)
rename src/runtime/{ => extra}/contrib/cblas/gemm_common.h (100%)
rename src/runtime/{ => extra}/contrib/cblas/mkl.cc (100%)
rename src/runtime/{ => extra}/contrib/clml/clml_memory_planner.cc (100%)
rename src/runtime/{ => extra}/contrib/clml/clml_memory_planner.h (100%)
rename src/runtime/{ => extra}/contrib/clml/clml_runtime.cc (99%)
rename src/runtime/{ => extra}/contrib/clml/clml_runtime.h (99%)
rename src/runtime/{ => extra}/contrib/clml/clml_utils.cc (100%)
rename src/runtime/{ => extra}/contrib/clml/clml_utils.h (100%)
rename src/runtime/{ => extra}/contrib/coreml/coreml_runtime.h (100%)
rename src/runtime/{ => extra}/contrib/coreml/coreml_runtime.mm (99%)
rename src/runtime/{ => extra}/contrib/cublas/cublas.cc (99%)
rename src/runtime/{ => extra}/contrib/cublas/cublas_json_runtime.cc (99%)
rename src/runtime/{ => extra}/contrib/cublas/cublas_utils.cc (98%)
rename src/runtime/{ => extra}/contrib/cublas/cublas_utils.h (100%)
rename src/runtime/{ => extra}/contrib/cudnn/conv_backward.cc (100%)
rename src/runtime/{ => extra}/contrib/cudnn/conv_forward.cc (100%)
rename src/runtime/{ => extra}/contrib/cudnn/cudnn_frontend/attention.cc (99%)
rename src/runtime/{ => extra}/contrib/cudnn/cudnn_frontend/attention.h (100%)
rename src/runtime/{ => extra}/contrib/cudnn/cudnn_json_runtime.cc (100%)
rename src/runtime/{ => extra}/contrib/cudnn/cudnn_utils.cc (100%)
rename src/runtime/{ => extra}/contrib/cudnn/cudnn_utils.h (99%)
rename src/runtime/{ => extra}/contrib/cudnn/softmax.cc (100%)
rename src/runtime/{ => extra}/contrib/curand/curand.cc (99%)
rename src/runtime/{ => extra}/contrib/curand/helper_cuda_kernels.cu (100%)
rename src/runtime/{ => extra}/contrib/curand/helper_cuda_kernels.h (100%)
rename src/runtime/{ => extra}/contrib/cutlass/fp16_group_gemm.cuh (100%)
rename src/runtime/{ => extra}/contrib/cutlass/fp16_group_gemm_runner_sm100.cuh (99%)
rename src/runtime/{ => extra}/contrib/cutlass/fp16_group_gemm_runner_sm90.cuh (99%)
rename src/runtime/{ => extra}/contrib/cutlass/fp16_group_gemm_sm100.cu (100%)
rename src/runtime/{ => extra}/contrib/cutlass/fp16_group_gemm_sm90.cu (100%)
rename src/runtime/{ => extra}/contrib/cutlass/fp8_gemm.cu (100%)
rename src/runtime/{ => extra}/contrib/cutlass/fp8_group_gemm_sm90.cu (100%)
rename src/runtime/{ => extra}/contrib/cutlass/fp8_groupwise_scaled_gemm.cuh (100%)
rename src/runtime/{ => extra}/contrib/cutlass/fp8_groupwise_scaled_gemm_runner_sm100.cuh (99%)
rename src/runtime/{ => extra}/contrib/cutlass/fp8_groupwise_scaled_gemm_runner_sm90.cuh (99%)
rename src/runtime/{ => extra}/contrib/cutlass/fp8_groupwise_scaled_gemm_sm100.cu (100%)
rename src/runtime/{ => extra}/contrib/cutlass/fp8_groupwise_scaled_gemm_sm90.cu (100%)
rename src/runtime/{ => extra}/contrib/cutlass/fp8_groupwise_scaled_group_gemm_runner_sm100.cuh (99%)
rename src/runtime/{ => extra}/contrib/cutlass/fp8_groupwise_scaled_group_gemm_sm100.cu (100%)
rename src/runtime/{ => extra}/contrib/cutlass/gemm_runner.cuh (99%)
rename src/runtime/{ => extra}/contrib/cutlass/weight_preprocess.cc (100%)
rename src/runtime/{ => extra}/contrib/dnnl/dnnl.cc (100%)
rename src/runtime/{ => extra}/contrib/dnnl/dnnl_json_runtime.cc (95%)
rename src/runtime/{ => extra}/contrib/dnnl/dnnl_kernel.h (100%)
rename src/runtime/{ => extra}/contrib/dnnl/dnnl_tensor_requisite.h (100%)
rename src/runtime/{ => extra}/contrib/dnnl/dnnl_utils.cc (100%)
rename src/runtime/{ => extra}/contrib/dnnl/dnnl_utils.h (100%)
rename src/runtime/{ => extra}/contrib/example_npu/example_npu_runtime.cc (100%)
rename src/runtime/{ => extra}/contrib/hipblas/hipblas.cc (99%)
rename src/runtime/{ => extra}/contrib/hipblas/hipblas_json_runtime.cc (99%)
rename src/runtime/{ => extra}/contrib/hipblas/hipblas_utils.cc (98%)
rename src/runtime/{ => extra}/contrib/hipblas/hipblas_utils.h (100%)
rename src/runtime/{ => extra}/contrib/json/json_node.h (100%)
rename src/runtime/{ => extra}/contrib/json/json_runtime.h (99%)
rename src/runtime/{ => extra}/contrib/nnapi/nnapi_builder.cc (100%)
rename src/runtime/{ => extra}/contrib/nnapi/nnapi_builder.h (100%)
rename src/runtime/{ => extra}/contrib/nnapi/nnapi_ops.cc (100%)
rename src/runtime/{ => extra}/contrib/nnapi/nnapi_ops.h (100%)
rename src/runtime/{ => extra}/contrib/nnapi/nnapi_runtime.cc (100%)
rename src/runtime/{ => extra}/contrib/nvshmem/dist_gemm.cu (99%)
rename src/runtime/{ => extra}/contrib/nvshmem/init.cc (99%)
rename src/runtime/{ => extra}/contrib/nvshmem/kv_transfer.cu (100%)
rename src/runtime/{ => extra}/contrib/nvshmem/memory_allocator.cc (97%)
rename src/runtime/{ => extra}/contrib/random/mt_random_engine.cc (100%)
rename src/runtime/{ => extra}/contrib/random/random.cc (100%)
rename src/runtime/{ => extra}/contrib/sort/sort.cc (99%)
rename src/runtime/{ => extra}/contrib/tensorrt/tensorrt_builder.cc (100%)
rename src/runtime/{ => extra}/contrib/tensorrt/tensorrt_builder.h (100%)
rename src/runtime/{ => extra}/contrib/tensorrt/tensorrt_calibrator.h (99%)
rename src/runtime/{ => extra}/contrib/tensorrt/tensorrt_logger.h (100%)
rename src/runtime/{ => extra}/contrib/tensorrt/tensorrt_ops.cc (100%)
rename src/runtime/{ => extra}/contrib/tensorrt/tensorrt_ops.h (100%)
rename src/runtime/{ => extra}/contrib/tensorrt/tensorrt_runtime.cc (99%)
rename src/runtime/{ => extra}/contrib/tensorrt/tensorrt_utils.h (100%)
rename src/runtime/{ => extra}/contrib/thrust/thrust.cu (99%)
rename src/runtime/{ => extra}/contrib/vllm/attention_kernels.cu (100%)
rename src/runtime/{ => extra}/contrib/vllm/attention_utils.cuh (100%)
rename src/runtime/{ => extra}/contrib/vllm/cache_alloc.cc (100%)
rename src/runtime/{ => extra}/contrib/vllm/cache_kernels.cu (100%)
rename src/runtime/{ => extra}/contrib/vllm/dtype_float16.h (100%)
rename src/runtime/{ => extra}/disco/bcast_session.cc (100%)
rename src/runtime/{ => extra}/disco/bcast_session.h (100%)
rename src/runtime/{ => extra}/disco/builtin.cc (100%)
rename src/runtime/{ => extra}/disco/cuda_ipc/cuda_ipc_memory.cc (98%)
rename src/runtime/{ => extra}/disco/cuda_ipc/custom_allreduce.cc (98%)
rename src/runtime/{ => extra}/disco/disco_worker.cc (99%)
rename src/runtime/{ => extra}/disco/disco_worker_thread.h (100%)
rename src/runtime/{ => extra}/disco/distributed/socket_session.cc (99%)
rename src/runtime/{ => extra}/disco/loader.cc (99%)
rename src/runtime/{ => extra}/disco/message_queue.h (100%)
rename src/runtime/{ => extra}/disco/nccl/nccl.cc (99%)
rename src/runtime/{ => extra}/disco/nccl/nccl_context.h (97%)
rename src/runtime/{ => extra}/disco/process_session.cc (98%)
rename src/runtime/{ => extra}/disco/protocol.h (98%)
rename src/runtime/{ => extra}/disco/session.cc (100%)
rename src/runtime/{ => extra}/disco/threaded_session.cc (98%)
rename src/runtime/{ => extra}/disco/utils.h (100%)
delete mode 100644 src/runtime/meta_data.h
delete mode 100644 src/runtime/nvtx.cc
rename src/runtime/{ => opencl}/texture.h (97%)
delete mode 100644 src/runtime/regex.cc
delete mode 100644 src/runtime/regex.h
rename src/runtime/{ => rpc}/minrpc/minrpc_server.h (100%)
rename src/runtime/{ => rpc}/minrpc/posix_popen_server/posix_popen_server.cc (100%)
rename src/runtime/{ => rpc}/minrpc/rpc_reference.h (100%)
rename src/runtime/{ => vulkan}/thread_map.h (97%)
delete mode 100644 src/tirx/transform/replace_global_vars.cc
delete mode 100644 tests/python/ir/test_transform_replace_global_var.py