Skip to content

Commit

Permalink
1
Browse files Browse the repository at this point in the history
  • Loading branch information
Your Name committed May 31, 2024
1 parent 0ce98ba commit fc45c3b
Showing 1 changed file with 0 additions and 20 deletions.
20 changes: 0 additions & 20 deletions vllm/model_executor/layers/fused_moe/ampere_fp8_fused_moe.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,8 +4,6 @@
import json
import os
from typing import Any, Dict, Optional, Tuple, Callable
import pkg_resources
import shutil

import torch
import triton
Expand All @@ -18,24 +16,6 @@
logger = init_logger(__name__)


def replace_triton_cuda():
    """Overwrite Triton's ``language/extra/cuda.py`` with the local copy.

    Copies ``triton_cuda.py`` from this module's directory over
    ``triton/language/extra/cuda.py`` inside the installed ``triton``
    distribution. The copy is only performed when the installed Triton
    version is exactly ``2.2.0``.

    Raises:
        AssertionError: If the installed ``triton`` version is not 2.2.0.
        OSError: If the source file is missing or the target cannot be
            written (propagated from ``shutil.copyfile``).
    """
    # Look the distribution up once; both the version and the install
    # location come from the same object.
    triton_dist = pkg_resources.get_distribution('triton')

    # Raise explicitly instead of using `assert`: assert statements are
    # stripped under `python -O`, which would let this function overwrite a
    # file inside an unverified Triton version.
    if triton_dist.version != "2.2.0":
        raise AssertionError(
            "replace_triton_cuda requires triton==2.2.0, "
            f"found {triton_dist.version}")

    module_dir = os.path.dirname(os.path.abspath(__file__))
    cur_folder_cuda_py = os.path.join(module_dir, 'triton_cuda.py')
    target_folder_cuda_py = os.path.join(
        triton_dist.location, 'triton', 'language', 'extra', 'cuda.py')
    shutil.copyfile(cur_folder_cuda_py, target_folder_cuda_py)


# NOTE: executed at import time; this modifies the installed triton package
# on disk before the kernels below are compiled.
replace_triton_cuda()


@triton.jit
def fused_moe_kernel(
# Pointers to matrices
Expand Down

0 comments on commit fc45c3b

Please sign in to comment.