路透社reuters话题分类
该数据集包含来自路透社的11,228条新闻,共标注为46个主题。与IMDB数据集一样,每条新闻都被编码为一系列单词索引。
若reuters数据集无法下载,可参考以下博客提供的下载和使用方法:
https://blog.youkuaiyun.com/sinat_41144773/article/details/89843688
代码实现
from keras.datasets import reuters
from keras.utils.np_utils import to_categorical
from keras import models
from keras.layers import LSTM
from keras.layers import Dense,Embedding
import numpy as np
import matplotlib.pyplot as plt
from keras.optimizers import Adam,RMSprop
from sklearn.metrics import confusion_matrix, f1_score, precision_score, recall_score,accuracy_score
# Load the Reuters newswire dataset and unpack it into (data, labels) pairs
# for the training split and the test split.
# NOTE(review): num_words=8000 presumably restricts the vocabulary to the 8000
# most frequent words -- confirm against the Keras `reuters.load_data` docs.
# The same value is used as the default `dimension` of vectorize_sequences.
(train_data, train_labels), (test_data, test_labels) = reuters.load_data(num_words=8000)
# vectorized sequences
def vectorize_sequences(sequences, dimension=8000):
results = n