Python + MeCab
#!/usr/bin/env python
# -*- coding: utf-8 -*-
"""Fetch the Yahoo! JAPAN top page, strip its HTML tags, and save the rest.

The tag-stripped page body is written to ``text.txt`` in the current
working directory.
"""
import re
from contextlib import closing

try:  # Python 3
    from urllib.request import urlopen
except ImportError:  # Python 2, which the original snippet targeted
    from urllib2 import urlopen

# closing() guarantees the connection is released even if read() raises;
# the Python 2 response object is not itself a context manager.
with closing(urlopen('http://www.yahoo.co.jp')) as fp:
    html = fp.read()

# Alias kept from the original listing.
data = html

# The response body is raw bytes, so a bytes pattern is used.
# Non-greedy match: remove everything from a '<' up to the nearest '>'.
# '.' does not match newlines, so a tag spanning several lines is left as-is.
p = re.compile(br'<.*?>')
res = p.sub(b'', data)

# Binary mode: the bytes are written unchanged, with no re-encoding.
with open('text.txt', 'wb') as f:
    f.write(res)

# NOTE(review): the original listing was cut off right after the final
# close() call; any statements that followed it are not visible here.
#coding:utf-8
"""Parse a sample Japanese sentence with MeCab and print the result."""
import MeCab

# "-Ochasen" asks MeCab for its ChaSen-compatible output format.
tagger = MeCab.Tagger("-Ochasen")
result = tagger.parse("この記事はPythonの勉強メモです。")

# Parenthesized so the statement is valid on both Python 2 and Python 3;
# with a single argument the printed output is the same on either.
print(result)