Python + XPath 爬取英文新闻并生成文档词频矩阵
1. 爬取新华网 Business - Finance 类别的新闻 URL
import requests
import json
from selenium import webdriver
from lxml import etree
import time
import os
import pandas as pd
import numpy as np
import re
import nlt...
原创
2018-05-15 17:10:44 ·
3183 阅读 ·
1 评论