kernels-community
/

megablocks

Model card Files Files and versions

megablocks / build /torch28-cxx11-cu129-x86_64-linux /ops /padded_gather.py

danieldk's picture

danieldk HF Staff

Revert "Build uploaded using `kernels`."

83c6859 5 months ago

History Blame Contribute Delete

1.26 kB

	# Copyright 2024 Databricks
	# SPDX-License-Identifier: Apache-2.0
	from typing import Any

	import torch
	from .stk_autocast import custom_bwd, custom_fwd

	from ..backend import kernels


	# Autograd wrapper for padded_gather kernel.
	class PaddedGatherOp(torch.autograd.Function):
	    """Autograd function pairing ``kernels.padded_gather`` with its gradient.

	    The forward pass delegates to ``kernels.padded_gather``; the backward
	    pass delegates to ``kernels.padded_scatter`` using the same index
	    tensors and ``top_k`` that were supplied to the forward pass.
	    """

	    @staticmethod
	    @custom_fwd
	    def forward(
	        ctx: Any,
	        x: torch.Tensor,
	        indices: torch.Tensor,
	        bin_ids: torch.Tensor,
	        bins: torch.Tensor,
	        padded_bins: torch.Tensor,
	        top_k: int,
	    ):
	        """Run the padded gather kernel on ``x``.

	        ``indices``, ``bin_ids``, ``bins`` and ``padded_bins`` are saved on
	        ``ctx`` and ``top_k`` is stored as a plain attribute so that
	        ``backward`` can replay them. Returns whatever
	        ``kernels.padded_gather`` returns.
	        """
	        # Everything backward() needs besides the incoming gradient.
	        routing = (indices, bin_ids, bins, padded_bins)
	        ctx.save_for_backward(*routing)
	        ctx.top_k = top_k

	        # The fourth positional argument is deliberately None here.
	        # NOTE(review): presumably an optional per-element weights tensor --
	        # confirm against the backend kernel signature.
	        gathered = kernels.padded_gather(x, indices, bin_ids, None, bins, padded_bins, top_k)
	        return gathered

	    @staticmethod
	    @custom_bwd
	    def backward(ctx: Any, grad: torch.Tensor):
	        """Propagate ``grad`` back to ``x`` via ``kernels.padded_scatter``.

	        Returns a 6-tuple aligned with the non-``ctx`` parameters of
	        ``forward``: the gradient for ``x`` followed by ``None`` for
	        ``indices``, ``bin_ids``, ``bins``, ``padded_bins`` and ``top_k``.
	        """
	        # Make the gradient contiguous before handing it to the kernel.
	        grad_contig = grad.contiguous()

	        saved_indices, saved_bin_ids, saved_bins, saved_padded_bins = ctx.saved_tensors
	        grad_x = kernels.padded_scatter(
	            grad_contig,
	            saved_indices,
	            saved_bin_ids,
	            None,
	            saved_bins,
	            saved_padded_bins,
	            ctx.top_k,
	        )

	        # Only x receives a gradient; the other five forward inputs get None.
	        return (grad_x, None, None, None, None, None)


	# Functional entry point: calling padded_gather(x, indices, bin_ids, bins,
	# padded_bins, top_k) dispatches through PaddedGatherOp.apply, so the call is
	# routed to PaddedGatherOp.forward and hooked up to PaddedGatherOp.backward.
	padded_gather = PaddedGatherOp.apply