@@ -1572,33 +1572,33 @@ void llm_graph_context::build_pooling(
1572
1572
ggml_tensor * inp_cls = build_inp_cls ();
1573
1573
inp = ggml_get_rows (ctx0, inp, inp_cls);
1574
1574
1575
- if (cls != nullptr ) {
1575
+ if (cls) {
1576
1576
// classification head
1577
1577
// https://github.com/huggingface/transformers/blob/5af7d41e49bbfc8319f462eb45253dcb3863dfb7/src/transformers/models/roberta/modeling_roberta.py#L1566
1578
1578
cur = ggml_mul_mat (ctx0, cls, inp);
1579
- if (cls_b != nullptr ) {
1579
+ if (cls_b) {
1580
1580
cur = ggml_add (ctx0, cur, cls_b);
1581
1581
}
1582
1582
cur = ggml_tanh (ctx0, cur);
1583
1583
1584
1584
if (cls_norm) {
1585
1585
// normalization head
1586
- cur = build_norm (cur, cls_norm, nullptr , LLM_NORM, 0 );
1586
+ cur = build_norm (cur, cls_norm, NULL , LLM_NORM, - 1 );
1587
1587
}
1588
1588
1589
1589
// some models don't have `cls_out`, for example: https://huggingface.co/jinaai/jina-reranker-v1-tiny-en
1590
1590
// https://huggingface.co/jinaai/jina-reranker-v1-tiny-en/blob/cb5347e43979c3084a890e3f99491952603ae1b7/modeling_bert.py#L884-L896
1591
1591
if (cls_out) {
1592
1592
cur = ggml_mul_mat (ctx0, cls_out, cur);
1593
- if (cls_out_b != nullptr ) {
1593
+ if (cls_out_b) {
1594
1594
cur = ggml_add (ctx0, cur, cls_out_b);
1595
1595
}
1596
1596
}
1597
1597
} else if (cls_out) {
1598
1598
// Single layer classification head (direct projection)
1599
1599
// https://github.com/huggingface/transformers/blob/f4fc42216cd56ab6b68270bf80d811614d8d59e4/src/transformers/models/bert/modeling_bert.py#L1476
1600
1600
cur = ggml_mul_mat (ctx0, cls_out, inp);
1601
- if (cls_out_b != nullptr ) {
1601
+ if (cls_out_b) {
1602
1602
cur = ggml_add (ctx0, cur, cls_out_b);
1603
1603
}
1604
1604
} else {
0 commit comments