Skip to content

Commit 1a66f9f

Browse files
authored
fix: Fix problem using ops.ones in BigBird (#1861)
1 parent e56d096 commit 1a66f9f

File tree

2 files changed

+8
-8
lines changed

2 files changed

+8
-8
lines changed

mindnlp/transformers/models/big_bird/modeling_big_bird.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -470,13 +470,13 @@ def bigbird_block_sparse_attention(
470 470   [
471 471   to_mask[:, :, :, : 3 * to_block_size],
472 472   to_mask[:, :, :, -to_block_size:],
473     - ops.ones([bsz, 1, 1, n_rand_blocks * to_block_size], dtype=to_mask.dtype),
    473 + ops.ones((bsz, 1, 1, n_rand_blocks * to_block_size), dtype=to_mask.dtype),
474 474   ],
475 475   dim=3,
476 476   )
477 477   second_rand_pad = ops.cat(
478 478   [
479     - ops.ones([bsz, n_heads, from_block_size, 4 * to_block_size], dtype=rand_mask.dtype),
    479 + ops.ones((bsz, n_heads, from_block_size, 4 * to_block_size), dtype=rand_mask.dtype),
480 480   rand_mask[:, :, 0],
481 481   ],
482 482   dim=3,
@@ -604,13 +604,13 @@ def bigbird_block_sparse_attention(
604 604   [
605 605   to_mask[:, :, :, :to_block_size],
606 606   to_mask[:, :, :, -3 * to_block_size :],
607     - ops.ones([bsz, 1, 1, n_rand_blocks * to_block_size], dtype=to_mask.dtype),
    607 + ops.ones((bsz, 1, 1, n_rand_blocks * to_block_size), dtype=to_mask.dtype),
608 608   ],
609 609   dim=3,
610 610   )
611 611   second_last_rand_pad = ops.cat(
612 612   [
613     - ops.ones([bsz, n_heads, from_block_size, 4 * to_block_size], dtype=rand_mask.dtype),
    613 + ops.ones((bsz, n_heads, from_block_size, 4 * to_block_size), dtype=rand_mask.dtype),
614 614   rand_mask[:, :, -1],
615 615   ],
616 616   dim=3,

mindnlp/transformers/models/bigbird_pegasus/modeling_bigbird_pegasus.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -450,13 +450,13 @@ def bigbird_block_sparse_attention(
450 450   [
451 451   to_mask[:, :, :, : 3 * to_block_size],
452 452   to_mask[:, :, :, -to_block_size:],
453     - ops.ones([bsz, 1, 1, n_rand_blocks * to_block_size], dtype=to_mask.dtype),
    453 + ops.ones((bsz, 1, 1, n_rand_blocks * to_block_size), dtype=to_mask.dtype),
454 454   ],
455 455   dim=3,
456 456   )
457 457   second_rand_pad = ops.cat(
458 458   [
459     - ops.ones([bsz, n_heads, from_block_size, 4 * to_block_size], dtype=rand_mask.dtype),
    459 + ops.ones((bsz, n_heads, from_block_size, 4 * to_block_size), dtype=rand_mask.dtype),
460 460   rand_mask[:, :, 0],
461 461   ],
462 462   dim=3,
@@ -584,13 +584,13 @@ def bigbird_block_sparse_attention(
584 584   [
585 585   to_mask[:, :, :, :to_block_size],
586 586   to_mask[:, :, :, -3 * to_block_size :],
587     - ops.ones([bsz, 1, 1, n_rand_blocks * to_block_size], dtype=to_mask.dtype),
    587 + ops.ones((bsz, 1, 1, n_rand_blocks * to_block_size), dtype=to_mask.dtype),
588 588   ],
589 589   dim=3,
590 590   )
591 591   second_last_rand_pad = ops.cat(
592 592   [
593     - ops.ones([bsz, n_heads, from_block_size, 4 * to_block_size], dtype=rand_mask.dtype),
    593 + ops.ones((bsz, n_heads, from_block_size, 4 * to_block_size), dtype=rand_mask.dtype),
594 594   rand_mask[:, :, -1],
595 595   ],
596 596   dim=3,

0 commit comments

Comments
 (0)