From 0e6190f8ecf1053477c73c7448c82888e8acacac Mon Sep 17 00:00:00 2001 From: Mattias Andrée Date: Thu, 25 Jul 2013 11:15:58 +0200 Subject: fundamentals of parsing an xml file MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: Mattias Andrée --- src/featherweight.py | 46 ++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 46 insertions(+) create mode 100755 src/featherweight.py diff --git a/src/featherweight.py b/src/featherweight.py new file mode 100755 index 0000000..776fa49 --- /dev/null +++ b/src/featherweight.py @@ -0,0 +1,46 @@ +#!/usr/bin/env python3 +# -*- coding: utf-8 -*- +''' +featherweight – A lightweight terminal news feed reader + +Copyright © 2013 Mattias Andrée (maandree@member.fsf.org) + +This program is free software: you can redistribute it and/or modify +it under the terms of the GNU General Public License as published by +the Free Software Foundation, either version 3 of the License, or +(at your option) any later version. + +This program is distributed in the hope that it will be useful, +but WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +GNU General Public License for more details. + +You should have received a copy of the GNU General Public License +along with this program. If not, see . +''' +import xml.parsers.expat +import sys + + +rss = sys.argv[1] +with open(rss, 'r') as file: + rss = file.read() + + +parser = xml.parsers.expat.ParserCreate() + +def start_element(name, attributes): + print('Start element:', name, attributes) +def end_element(name): + print('End element:', name) +def char_data(data): + print('Character data:', repr(data)) + + +parser.StartElementHandler = start_element +parser.EndElementHandler = end_element +parser.CharacterDataHandler = char_data + + +parser.Parse(rss, True) + -- cgit v1.2.3-70-g09d2