Skip to content

random sample算子太初平台 #169

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Open
wants to merge 3 commits into
base: teco
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
48 changes: 21 additions & 27 deletions operatorspy/tests/random_sample.py
Original file line number Diff line number Diff line change
Expand Up @@ -31,47 +31,32 @@ class RandomSampleDescriptor(Structure):

def random_sample(data, random_val, topp, topk, voc, temperature, torch_device):
    """Reference top-k / top-p sampling used to check the device result.

    The logits are ordered from largest to smallest, converted to
    probabilities with a temperature-scaled softmax, limited to the ``topk``
    most likely entries and then cut at the first position whose cumulative
    probability reaches ``topp``.  ``random_val`` is rescaled to the retained
    probability mass and the first candidate whose cumulative probability
    exceeds it is returned.

    Args:
        data: Tensor of logits (assumed 1-D). It is not modified.
        random_val: Uniform sample, expected in ``[0, 1)``.
        topp: Cumulative-probability cutoff.
        topk: Maximum number of candidates; clamped to ``len(data)``.
        voc: Unused here; kept so existing callers keep working.
        temperature: Divisor applied to the shifted logits before softmax.
        torch_device: Unused here; kept so existing callers keep working.

    Returns:
        A 0-dim integer tensor holding the index into ``data`` of the
        selected entry.

    Raises:
        ValueError: If ``topk`` is not positive or ``data`` is empty.
    """
    sorted_indices = torch.argsort(data, descending=True)

    # Never look at more candidates than there are entries.
    topk = min(topk, sorted_indices.shape[0])
    if topk <= 0:
        raise ValueError("topk must be positive and data must be non-empty")
    indices = sorted_indices[:topk]

    # Indexing with a tensor produces a copy, so the in-place running sum
    # below never touches the caller's `data`.
    probs = data[sorted_indices]
    # Shift by the maximum (first element after sorting) before scaling so
    # the softmax exponentials cannot overflow.
    probs = (probs - probs[0]) / temperature
    probs = torch.softmax(probs.float(), dim=0)

    # Turn the first `topk` probabilities into cumulative probabilities.
    # Kept as an explicit sequential float32 sum so the rounding is the same
    # as in the straightforward reference loop.
    for i in range(1, topk):
        probs[i] = probs[i] + probs[i - 1]

    # `end` is the number of candidates kept: everything up to and including
    # the first one whose cumulative probability reaches `topp`, or all
    # `topk` candidates when the cutoff is never reached.
    end = topk
    for pos in range(topk):
        if probs[pos] >= topp:
            end = pos + 1
            break

    # Rescale the uniform sample to the probability mass that was kept.
    random_val *= probs[end - 1]

    for i in range(end):
        if random_val < probs[i]:
            return indices[i]

    # Only reachable when random_val scales to exactly the retained mass
    # (e.g. random_val == 1.0); fall back to the last kept candidate instead
    # of implicitly returning None.
    return indices[end - 1]

def random_sample_0(data):
Expand Down Expand Up @@ -129,7 +114,7 @@ def test(lib, handle, torch_device, voc, random_val, topp, topk, temperature, x_
)
if torch_device == "npu":
torch.npu.synchronize()

assert indices[0].type(ans.dtype) == ans or data[ans] == data[indices[0]]
check_error(lib.infiniopDestroyRandomSampleDescriptor(descriptor))
print("Test passed!")
Expand Down Expand Up @@ -168,7 +153,13 @@ def test_ascend(lib, test_cases):
test(lib, handle, "npu", voc, random_val, topp, topk, temperature)
destroy_handle(lib, handle)


def test_teco(lib, test_cases):
    """Run every random-sample test case on the Teco SDAA backend.

    Args:
        lib: Loaded operator library, passed through to ``create_handle``,
            ``test`` and ``destroy_handle``.
        test_cases: Iterable of ``(voc, random_val, topp, topk, temperature)``
            tuples.
    """
    # Imported here rather than at module level so the other backends can be
    # tested on machines without torch_sdaa installed.
    # NOTE(review): presumably this import is what makes the "sdaa" torch
    # device available - confirm.
    import torch_sdaa  # noqa: F401

    device = DeviceEnum.DEVICE_TECO
    handle = create_handle(lib, device)
    try:
        for voc, random_val, topp, topk, temperature in test_cases:
            test(lib, handle, "sdaa", voc, random_val, topp, topk, temperature)
    finally:
        # Release the handle even when a test case raises.
        destroy_handle(lib, handle)

if __name__ == "__main__":
test_cases = [
Expand Down Expand Up @@ -224,6 +215,9 @@ def test_ascend(lib, test_cases):
test_bang(lib, test_cases)
if args.ascend:
test_ascend(lib, test_cases)
if not (args.cpu or args.cuda or args.bang or args.ascend):
if args.teco:
test_teco(lib, test_cases)

if not (args.cpu or args.cuda or args.bang or args.ascend or args.teco):
test_cpu(lib, test_cases)
print("\033[92mTest passed!\033[0m")
23 changes: 22 additions & 1 deletion src/ops/random_sample/operator.cc
Original file line number Diff line number Diff line change
Expand Up @@ -14,6 +14,9 @@
#ifdef ENABLE_ASCEND_NPU
#include "ascend/random_sample.h"
#endif
#ifdef ENABLE_TECO_SDAA
#include "teco/random_sample_teco.h"
#endif

__C infiniopStatus_t infiniopCreateRandomSampleDescriptor(infiniopHandle_t handle, infiniopRandomSampleDescriptor_t *desc_ptr, infiniopTensorDescriptor_t result, infiniopTensorDescriptor_t probs) {
switch (handle->device) {
Expand All @@ -35,8 +38,14 @@ __C infiniopStatus_t infiniopCreateRandomSampleDescriptor(infiniopHandle_t handl
#ifdef ENABLE_ASCEND_NPU
case DevAscendNpu: {
return ascendCreateRandomSampleDescriptor((AscendHandle_t) handle,
(RandomSampleAscendDescriptor_t *) desc_ptr, result, probs);
(RandomSampleAscendDescriptor_t *) desc_ptr, result, probs);
}
#endif
#ifdef ENABLE_TECO_SDAA
case DevTecoSDAA:
return tecoCreateRandomSampleDescriptor((TecoHandle_t) handle,
(RandomSampleTecoDescriptor_t *) desc_ptr, result, probs);
;
#endif
}
return STATUS_BAD_DEVICE;
Expand Down Expand Up @@ -64,6 +73,10 @@ __C infiniopStatus_t infiniopGetRandomSampleWorkspaceSize(infiniopRandomSampleDe
case DevAscendNpu: {
return ascendGetRandomSampleWorkspaceSize((RandomSampleAscendDescriptor_t) desc, size);
}
#endif
#ifdef ENABLE_TECO_SDAA
case DevTecoSDAA:
return tecoGetRandomSampleWorkspaceSize((RandomSampleTecoDescriptor_t) desc, size);
#endif
}
return STATUS_BAD_DEVICE;
Expand Down Expand Up @@ -97,6 +110,10 @@ __C infiniopStatus_t infiniopRandomSample(infiniopRandomSampleDescriptor_t desc,
case DevAscendNpu: {
return ascendRandomSample((RandomSampleAscendDescriptor_t) desc, workspace, workspace_size, result, probs, random_val, topp, topk, temperature, stream);
}
#endif
#ifdef ENABLE_TECO_SDAA
case DevTecoSDAA:
return tecoRandomSample((RandomSampleTecoDescriptor_t) desc, workspace, workspace_size, result, probs, random_val, topp, topk, temperature, stream);
#endif
}
return STATUS_BAD_DEVICE;
Expand All @@ -121,6 +138,10 @@ __C infiniopStatus_t infiniopDestroyRandomSampleDescriptor(infiniopRandomSampleD
case DevAscendNpu: {
return ascendDestroyRandomSampleDescriptor((RandomSampleAscendDescriptor_t) desc);
}
#endif
#ifdef ENABLE_TECO_SDAA
case DevTecoSDAA:
return tecoDestroyRandomSampleDescriptor((RandomSampleTecoDescriptor_t) desc);
#endif
}
return STATUS_BAD_DEVICE;
Expand Down
42 changes: 42 additions & 0 deletions src/ops/random_sample/teco/random_sample_teco.h
Original file line number Diff line number Diff line change
@@ -0,0 +1,42 @@
#ifndef __SDAA_RANDOM_SAMPLE_H__
#define __SDAA_RANDOM_SAMPLE_H__

#include "../../../devices/teco/teco_handle.h"
#include "../../utils.h"
#include "operators.h"
#include <sdaa_runtime.h>

// Descriptor for the random-sample operator on the Teco SDAA backend.
// operator.cc casts its generic descriptor pointer to this type in the
// DevTecoSDAA case of each infiniop*RandomSample* entry point.
// NOTE(review): the field meanings below are inferred from names and types
// only; confirm against the implementation of tecoCreateRandomSampleDescriptor.
struct RandomSampleTecoDescriptor {
Device device;          // device tag; presumably DevTecoSDAA - confirm
int device_id;          // presumably the SDAA device ordinal - confirm
tecodnnHandle_t handle; // tecodnn library handle
sdaaStream_t stream;    // SDAA stream; ownership is not visible from this header
DT dtype;               // presumably the element type of the probs tensor - confirm
int voc;                // presumably the number of entries in probs (vocabulary size) - confirm
DT rDtype;              // presumably the element type of the result tensor - confirm
int rLength;            // presumably the element count of the result tensor - confirm
};

// Pointer alias used by the teco* functions below and by the casts in operator.cc.
typedef struct RandomSampleTecoDescriptor *RandomSampleTecoDescriptor_t;

// Creates a Teco random-sample descriptor and stores it in *desc_ptr.
// Called by infiniopCreateRandomSampleDescriptor for DevTecoSDAA handles when
// ENABLE_TECO_SDAA is defined; the returned status is passed straight back
// to that caller.
//   handle   - Teco device handle
//   desc_ptr - output location for the new descriptor
//   result   - tensor descriptor of the sampled-index output
//   probs    - tensor descriptor of the input being sampled
infiniopStatus_t tecoCreateRandomSampleDescriptor(TecoHandle_t handle,
RandomSampleTecoDescriptor_t *desc_ptr, infiniopTensorDescriptor_t result,
infiniopTensorDescriptor_t probs);

// Reports the workspace size for `desc` through *size.
// Called by infiniopGetRandomSampleWorkspaceSize in the DevTecoSDAA case.
// NOTE(review): presumably the size is in bytes - confirm in the implementation.
infiniopStatus_t tecoGetRandomSampleWorkspaceSize(RandomSampleTecoDescriptor_t desc, uint64_t *size);

// Runs random sampling on the Teco SDAA backend.
// Called by infiniopRandomSample in the DevTecoSDAA case, which forwards all
// of its arguments unchanged.
//   desc           - descriptor from tecoCreateRandomSampleDescriptor
//   workspace      - scratch buffer; NOTE(review): presumably must be at least
//                    the size reported by tecoGetRandomSampleWorkspaceSize - confirm
//   workspace_size - size of `workspace`
//   result         - output buffer for the sampled index
//   probs          - input buffer being sampled (read-only)
//   random_val     - caller-supplied random number
//   topp           - top-p cutoff
//   topk           - top-k cutoff
//   temperature    - sampling temperature
//   stream         - opaque stream pointer; NOTE(review): presumably an
//                    sdaaStream_t - confirm
infiniopStatus_t tecoRandomSample(RandomSampleTecoDescriptor_t desc,
void *workspace,
uint64_t workspace_size,
void *result,
void const *probs,
float random_val,
float topp,
int topk,
float temperature,
void *stream);

// Destroys a descriptor obtained from tecoCreateRandomSampleDescriptor.
// Called by infiniopDestroyRandomSampleDescriptor in the DevTecoSDAA case.
infiniopStatus_t tecoDestroyRandomSampleDescriptor(RandomSampleTecoDescriptor_t desc);


#endif
Loading