diff --git a/kernel_meta/kernel_meta_2003868091326117548/kernel_meta/te_notequal_364c7d0e50b7d3e1ee53996fddce4437fed02e4179bde64476c998236ae04c0e_1.json b/kernel_meta/kernel_meta_2003868091326117548/kernel_meta/te_notequal_364c7d0e50b7d3e1ee53996fddce4437fed02e4179bde64476c998236ae04c0e_1.json new file mode 100644 index 000000000..e575427da --- /dev/null +++ b/kernel_meta/kernel_meta_2003868091326117548/kernel_meta/te_notequal_364c7d0e50b7d3e1ee53996fddce4437fed02e4179bde64476c998236ae04c0e_1.json @@ -0,0 +1,19 @@ +{ + "KBHit":false, + "binFileName":"te_notequal_364c7d0e50b7d3e1ee53996fddce4437fed02e4179bde64476c998236ae04c0e_1", + "binFileSuffix":".o", + "blockDim":1, + "coreType":"VectorCore", + "deterministic":"ignore", + "intercoreSync":0, + "kernelName":"te_notequal_364c7d0e50b7d3e1ee53996fddce4437fed02e4179bde64476c998236ae04c0e_1__kernel0", + "magic":"RT_DEV_BINARY_MAGIC_ELF_AIVEC", + "memoryStamping":[], + "opParaSize":0, + "parameters":[ + null, + null, + null + ], + "sha256":"0463850c6323ea4c82f765616710ef1dfcb60ffff1ac1ddc3f41e89288c8d28a" +} \ No newline at end of file diff --git a/kernel_meta/kernel_meta_2003868091326117548/kernel_meta/te_notequal_364c7d0e50b7d3e1ee53996fddce4437fed02e4179bde64476c998236ae04c0e_1.o b/kernel_meta/kernel_meta_2003868091326117548/kernel_meta/te_notequal_364c7d0e50b7d3e1ee53996fddce4437fed02e4179bde64476c998236ae04c0e_1.o new file mode 100644 index 000000000..f054e3c87 Binary files /dev/null and b/kernel_meta/kernel_meta_2003868091326117548/kernel_meta/te_notequal_364c7d0e50b7d3e1ee53996fddce4437fed02e4179bde64476c998236ae04c0e_1.o differ diff --git a/kernel_meta_temp_16274467486236309844/buildPidInfo.json b/kernel_meta_temp_16274467486236309844/buildPidInfo.json new file mode 100644 index 000000000..87d734034 --- /dev/null +++ b/kernel_meta_temp_16274467486236309844/buildPidInfo.json @@ -0,0 +1,6 @@ +[ + [ + 3439890, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_4302799503727008734" + ] +] \ No newline at end of file diff --git a/kernel_meta_temp_17044593291566822053/buildPidInfo.json b/kernel_meta_temp_17044593291566822053/buildPidInfo.json new file mode 100644 index 000000000..077bc1654 --- /dev/null +++ b/kernel_meta_temp_17044593291566822053/buildPidInfo.json @@ -0,0 +1,6 @@ +[ + [ + 419546, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_10595876705721420016" + ] +] \ No newline at end of file diff --git a/kernel_meta_temp_17393875604103931/buildPidInfo.json b/kernel_meta_temp_17393875604103931/buildPidInfo.json new file mode 100644 index 000000000..d7bfd22d7 --- /dev/null +++ b/kernel_meta_temp_17393875604103931/buildPidInfo.json @@ -0,0 +1,130 @@ +[ + [ + 730815, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_17438986247853928722" + ], + [ + 748121, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_9042571282781501195" + ], + [ + 772931, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_13561603852611107281" + ], + [ + 962160, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_17652122168333968458" + ], + [ + 992078, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_8328069733520576387" + ], + [ + 1024724, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_10852159473492996615" + ], + [ + 1052747, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_1965741910731265513" + ], + [ + 1063905, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_9951644031148627187" + ], + [ + 1095958, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_9977857833561060082" + ], + [ + 1114789, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_2798749991041415536" + ], + [ + 1136177, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_10226972389373224560" + ], + [ + 1165202, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_1083703252434699971" + ], + [ + 1168170, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_4031511101427731290" + ], + [ + 1174449, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_18209585249912247408" + ], + [ + 1176862, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_2091761881164873326" + ], + [ + 1186624, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_7349939208149454905" + ], + [ + 1203662, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_12443456610341136723" + ], + [ + 1205685, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_15334538486333168998" + ], + [ + 1211956, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_6723213923785905412" + ], + [ + 1222952, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_15853831961758292114" + ], + [ + 1227416, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_2852566461672193937" + ], + [ + 1233286, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_17167099510868149006" + ], + [ + 1274390, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_11390322069969700060" + ], + [ + 1289989, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_9683260956464187754" + ], + [ + 1292609, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_13344674103348759168" + ], + [ + 1294263, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_1401687578104008397" + ], + [ + 1297275, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_9340049039727419272" + ], + [ + 1299101, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_4270614156502846006" + ], + [ + 1300952, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_15708884068586704614" + ], + [ + 1315681, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_9882675287703648155" + ], + [ + 1328969, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_15240988205801878635" + ], + [ + 1373305, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_16316567712180939426" + ] +] \ No newline at end of file diff --git a/kernel_meta_temp_3685030010405750619/buildPidInfo.json b/kernel_meta_temp_3685030010405750619/buildPidInfo.json new file mode 100644 index 000000000..b9777ab5d --- /dev/null +++ b/kernel_meta_temp_3685030010405750619/buildPidInfo.json @@ -0,0 +1,6 @@ +[ + [ + 1634988, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_987714910372939987" + ] +] \ No newline at end of file diff --git a/kernel_meta_temp_6263103544429038229/buildPidInfo.json b/kernel_meta_temp_6263103544429038229/buildPidInfo.json new file mode 100644 index 000000000..f826c98a9 --- /dev/null +++ b/kernel_meta_temp_6263103544429038229/buildPidInfo.json @@ -0,0 +1,26 @@ +[ + [ + 1278012, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_11398586797771384334" + ], + [ + 1309696, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_13868717514186821465" + ], + [ + 1317392, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_13299477596528331129" + ], + [ + 1473626, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_2003868091326117548" + ], + [ + 1538757, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_3816004234326890543" + ], + [ + 2027226, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_13875673836168841592" + ] +] \ No newline at end of file diff --git a/kernel_meta_temp_6263103544429038229/task_pid_1473626_1479641.txt b/kernel_meta_temp_6263103544429038229/task_pid_1473626_1479641.txt new file mode 100644 index 000000000..85c6a62bc --- /dev/null +++ b/kernel_meta_temp_6263103544429038229/task_pid_1473626_1479641.txt @@ -0,0 +1 @@ +281471747027232.124 diff --git a/kernel_meta_temp_6803255206518235934/buildPidInfo.json b/kernel_meta_temp_6803255206518235934/buildPidInfo.json new file mode 100644 index 000000000..fc89bbdcc --- /dev/null +++ b/kernel_meta_temp_6803255206518235934/buildPidInfo.json @@ -0,0 +1,158 @@ +[ + [ + 1665635, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_2070681248079114431" + ], + [ + 1669243, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_15972988884021768035" + ], + [ + 1671735, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_14462458265164730148" + ], + [ + 1698537, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_7714407451463426009" + ], + [ + 1732162, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_8093432001578936120" + ], + [ + 1751907, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_13495005174825000525" + ], + [ + 1767034, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_1148414944764641249" + ], + [ + 1770476, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_4593780200289858929" + ], + [ + 1777271, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_8999278063834901484" + ], + [ + 1795613, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_4057774841895083283" + ], + [ + 1799060, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_254490910956240413" + ], + [ + 1800556, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_1304679340362438230" + ], + [ + 1808401, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_7705012627620895413" + ], + [ + 1811425, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_9212000814920849058" + ], + [ + 1817569, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_2535118358430474166" + ], + [ + 1831958, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_15852957858253228207" + ], + [ + 1836101, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_16065293264588911878" + ], + [ + 1847206, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_10428916002563314800" + ], + [ + 1852046, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_3462605367797933820" + ], + [ + 1856753, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_6173152488185473017" + ], + [ + 1858576, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_6438249594721386150" + ], + [ + 1861139, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_5599408892120233732" + ], + [ + 1862920, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_5127044358392781462" + ], + [ + 1864354, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_1648987811990508290" + ], + [ + 1866564, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_15720643386659449480" + ], + [ + 1885545, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_3435037455676822346" + ], + [ + 1887062, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_970417178506262714" + ], + [ + 1908947, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_15337059914871875866" + ], + [ + 1910288, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_18195933536594227160" + ], + [ + 1912014, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_10294805498921314753" + ], + [ + 1913228, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_7616616554817270553" + ], + [ + 1914684, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_8597952330701423880" + ], + [ + 1917448, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_8681966603034129951" + ], + [ + 1921635, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_12076566523787540173" + ], + [ + 1961161, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_14361218754409734998" + ], + [ + 1970433, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_17131376246755817590" + ], + [ + 2023297, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_14159057209005041734" + ], + [ + 2025901, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_13914545232858777416" + ], + [ + 2027529, + "/data1/home/zengqunhong/libai/kernel_meta/kernel_meta_3799579533752641357" + ] +] \ No newline at end of file diff --git a/rep.py b/rep.py new file mode 100644 index 000000000..1637eceee --- /dev/null +++ b/rep.py @@ -0,0 +1,6 @@ +import oneflow as flow +import oneflow_npu + +ids = flow.tensor([1, 2, 3, 4], dtype=flow.int64, device="npu") +t = flow.tensor([1, 2, 0, 4], dtype=flow.int64, device="npu") +print(t == ids) \ No newline at end of file diff --git a/test_cmask.py b/test_cmask.py new file mode 100644 index 000000000..37ff0baf0 --- /dev/null +++ b/test_cmask.py @@ -0,0 +1,83 @@ +import oneflow as flow +import oneflow_npu +from oneflow import nn +from libai.utils import distributed as dist + + +class CasualMask(nn.Module): + def __init__(self, max_positions=1024, dtype=flow.float16, *, layer_idx=0): + super().__init__() + self.dtype = dtype + self.mask = flow.full( + (max_positions, max_positions), + flow.finfo(dtype).min, + placement=dist.get_layer_placement(layer_idx), + sbp=dist.get_nd_sbp([flow.sbp.broadcast, flow.sbp.broadcast]), + ) + matrix = flow.ones( + (self.mask.size(-1), self.mask.size(-1)), + dtype=flow.bool, + placement=dist.get_layer_placement(layer_idx), + sbp=dist.get_nd_sbp([flow.sbp.broadcast, flow.sbp.broadcast]), + ) + upper_triangular_mask = flow.tril(matrix) + + self.mask.masked_fill_(upper_triangular_mask, 0) + self.mask = self.mask.to(dtype) + + def forward(self, input_ids, past_length=0, attention_mask=None, input_dtype=None): + bsz, tgt_len = input_ids.size() + casual_mask = self.mask[:tgt_len, :tgt_len] + if past_length > 0: + # in case past_key_values are used, we need to add a prefix ones mask to casual mask + casual_mask = flow.cat( + [flow.ones(tgt_len, past_length, dtype=self.dtype), casual_mask], dim=-1 + ) + casual_mask = ( + casual_mask.unsqueeze(0).unsqueeze(1).expand(bsz, 1, tgt_len, tgt_len + past_length) + ) + # casual_mask = casual_mask.to_global(sbp=input_ids.sbp) + # attention_mask = None # fix llama infer error + if attention_mask is not None: + bsz, src_len = attention_mask.size() + print(attention_mask) + attention_mask = ( + attention_mask[:, None, None, :] + .expand(bsz, 1, tgt_len, src_len) + .to(casual_mask.dtype) + ) + print(attention_mask) + attention_mask = attention_mask.to_global(placement=casual_mask.placement) + casual_mask = casual_mask + attention_mask + if input_dtype is not None: + casual_mask = casual_mask.to(input_dtype) + return casual_mask + + +m = CasualMask() +ids = flow.tensor( + [[1, 25538, 2211, 25562, 363, 7952, 292, 9045, 29891, 29889]], dtype=flow.long +) + +attent = flow.tensor( + [ + [ + 0.0000e00, + -3.4028e38, + 0.0000e00, + -3.4028e38, + 0.0000e00, + -3.4028e38, + 0.0000e00, + -3.4028e38, + 0.0000e00, + -3.4028e38, + ] + ], + dtype=flow.float32, + placement=dist.get_layer_placement(0), + sbp=dist.get_nd_sbp([flow.sbp.broadcast, flow.sbp.broadcast]), +) +print(attent.shape) +mask = m(ids, input_dtype=flow.float32, attention_mask=attent) +print(mask)