Bert的简单使用

最新推荐文章于 2025-05-10 20:44:16 发布

原创 · 最新推荐文章于 2025-05-10 20:44:16 发布 · 546 阅读

1 ·

CC 4.0 BY-SA版权

python编程同时被 2 个专栏收录

139 篇文章

订阅专栏

pytorch

47 篇文章

订阅专栏

本文介绍了一个简单的BERT模型使用案例，展示了如何将文本输入转化为向量表示，并将输出的矩阵保存到文件中。通过实例，文章详细说明了BERT模型的输入准备、调用及输出处理过程。

摘要生成于 C知道，由 DeepSeek-R1 满血版支持，前往体验 >

简单使用了一下 BERT：对一组句子进行编码，并将模型输出的 pooled_output 矩阵写入文件。

import torch
from transformers import BertConfig, BertModel, BertTokenizer

def bert_output(texts, name):
    """Encode a batch of sentences with BERT and append the pooled output to a file.

    Uses the module-level ``tokenizer`` and ``model`` objects, which must be
    defined before this function is called.

    Args:
        texts: Sentences to encode. Each sentence is tokenized and converted
            to ids as-is; no special tokens are added here, so callers that
            want ``[CLS]``/``[SEP]`` must include them in the text.
        name: Path of the output text file. It is opened in append mode, so
            repeated calls accumulate output.

    Raises:
        ValueError: If ``texts`` yields no sentences.
    """
    token_ids = [
        tokenizer.convert_tokens_to_ids(tokenizer.tokenize(text))
        for text in texts
    ]
    if not token_ids:
        raise ValueError("texts must contain at least one sentence")

    # Every sentence is right-padded to the length of the longest one.
    max_len = max(len(ids) for ids in token_ids)

    input_ids, token_type_ids, attention_mask = [], [], []
    for ids in token_ids:
        pad_len = max_len - len(ids)
        # Token id 0 is used as the padding id (same value as the original code).
        input_ids.append(ids + [0] * pad_len)
        # Single-segment input: every position belongs to segment 0.
        token_type_ids.append([0] * max_len)
        # 1 marks a real token, 0 marks padding so attention ignores it.
        attention_mask.append([1] * len(ids) + [0] * pad_len)

    input_ids_tensor = torch.tensor(input_ids)
    token_type_ids_tensor = torch.tensor(token_type_ids)
    attention_mask_tensor = torch.tensor(attention_mask)

    # Pass by keyword: BertModel.forward takes attention_mask before
    # token_type_ids, so positional (ids, segments, mask) would swap them.
    output = model(
        input_ids=input_ids_tensor,
        attention_mask=attention_mask_tensor,
        token_type_ids=token_type_ids_tensor,
    )
    # output[0] is the per-token sequence output; output[1] is the pooled
    # output, which is what gets written.
    pooled_output = output[1]

    # Raise the print threshold so str() does not elide matrix entries.
    # NOTE: this changes torch's global print options.
    torch.set_printoptions(edgeitems=768)

    with open(name, 'a', encoding='utf-8') as f:
        f.write("pooled_output:")
        f.write(str(pooled_output))

if __name__ == '__main__':
    # Local directory holding the pretrained checkpoint files.
    pretrained_dir = './bert-base-uncased'

    # bert_output() reads `tokenizer` and `model` as module-level globals,
    # so these two names must stay exactly as they are.
    tokenizer = BertTokenizer.from_pretrained(pretrained_dir)
    # Per the original author's note: model_config.hidden_size=768
    model_config = BertConfig.from_pretrained(pretrained_dir)
    model = BertModel.from_pretrained(pretrained_dir, config=model_config)

    # Sample sentences, three per dataset, already wrapped in [CLS]/[SEP].
    texts_atis = [
        "[CLS] i want to fly from baltimore to dallas round trip [SEP]",
        "[CLS] show me the flights arriving baltimore on june fourteenth [SEP]",
        "[CLS] which airlines fly from boston to washington via other cities [SEP]",
    ]
    texts_snips = [
        "[CLS] what the weather in my current spot the [SEP]",
        "[CLS] what the weather like in the city frewen [SEP]",
        "[CLS] what the weather supposed to be like today [SEP]",
    ]

    # Output files, one per dataset.
    atis = 'atis.txt'
    snips = 'snips.txt'

    # Only the SNIPS sentences are encoded; the ATIS inputs are defined but
    # not used in this run.
    bert_output(texts_snips, snips)