"""Collect the <title> texts of an RSS feed and write them to a text file.

Usage:
    script.py OUTPUT_FILE [FEED_URL]

Only constructs valid on both Python 2.7 and Python 3.3+ are used.
"""
import contextlib
import io
import re
import sys

try:
    import urllib2  # Python 2
except ImportError:
    # Python 3 moved Request/urlopen here; the API used below is the same.
    import urllib.request as urllib2

# Browser-like User-Agent sent with the feed request.
USER_AGENT = (
    "Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 5.1; Trident/4.0; "
    ".NET CLR 2.0.50727; .NET CLR 3.0.4506.2152; .NET CLR 3.5.30729)"
)

# Feed fetched when no FEED_URL argument is given on the command line.
DEFAULT_FEED_URL = "http://npteam.net/rss"

# NOTE(review): the feed is assumed to be UTF-8 (the XML default); bytes that
# do not decode are replaced rather than aborting the whole run.
FEED_ENCODING = "utf-8"

# The pattern in the published listing had lost its tag delimiters (it read
# "([^<]+) "), which matches almost any text.  It is restored here to capture
# the text of <title> elements, which is the stated purpose of the script.
_TITLE_RE = re.compile(r"<title\b[^>]*>([^<]+)</title>")


def getTitle(url, timeout=30):
    """Return the text of every ``<title>`` element found at *url*.

    The document is scanned line by line, so a title is only found when its
    opening and closing tags are on the same line.  Several titles on one
    line are all returned, in document order.

    Args:
        url: Address of the feed; any scheme ``urlopen`` supports.
        timeout: Seconds to wait on the network before giving up.

    Returns:
        A list of title strings with surrounding whitespace removed.

    Raises:
        EnvironmentError: The feed could not be opened or read (``URLError``
            and socket timeouts are subclasses).
    """
    request = urllib2.Request(url)
    request.add_header("User-agent", USER_AGENT)

    titles = []
    # closing() guarantees the connection is released even if reading fails.
    with contextlib.closing(urllib2.urlopen(request, timeout=timeout)) as response:
        for raw_line in response.readlines():
            line = raw_line.decode(FEED_ENCODING, "replace")
            for captured in _TITLE_RE.findall(line):
                text = captured.strip()
                if text:
                    titles.append(text)
    return titles


def main(argv):
    """Fetch the feed titles and write them, one per line, to a file.

    Args:
        argv: Command-line style argument list: ``argv[1]`` is the output
            file path and the optional ``argv[2]`` overrides the feed URL.

    Raises:
        SystemExit: No output file path was supplied.
        EnvironmentError: The feed could not be fetched or the output file
            could not be written.
    """
    if len(argv) < 2:
        program = argv[0] if argv else "rss_titles"
        raise SystemExit("usage: %s OUTPUT_FILE [FEED_URL]" % program)

    # str.strip() returns a new string; the result must be kept.
    export_path = str(argv[1]).strip()
    url = argv[2] if len(argv) > 2 else DEFAULT_FEED_URL

    titles = getTitle(url)

    # newline="" disables newline translation so each record ends in exactly
    # "\r\n" on every platform (text mode on Windows would emit "\r\r\n").
    with io.open(export_path, "w", encoding="utf-8", newline="") as out:
        out.writelines(title + u"\r\n" for title in titles)


if __name__ == "__main__":
    try:
        main(argv=sys.argv)
    except EnvironmentError as err:
        # EnvironmentError covers IOError/OSError (and URLError) on Python 2
        # and is an alias of OSError on Python 3.
        sys.stderr.write("%s\n" % err)
        sys.exit(1)
[Python] RSS에서 title 내용만 가져오기
프로그래밍/Python
2013/03/20 19:41
RSS 내용 중에서 title 내용만 가져오기 위한 간단한 소스 코드입니다.
덧글을 달아 주세요