# -*- coding: utf-8 -*- # # Copyright (C) 2015 lpschedule-generator contributors. See CONTRIBUTORS. # # This file is part of lpschedule-generator. # # lpschedule-generator is free software: you can redistribute it # and/or modify it under the terms of the GNU General Public License # as published by the Free Software Foundation, either version 3 of # the License, or (at your option) any later version. # # lpschedule-generator is distributed in the hope that it will be useful, but # WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU # General Public License for more details. # # You should have received a copy of the GNU General Public License # along with lpschedule-generator (see COPYING). If not, see # . import json import sys from argparse import ArgumentParser from collections import OrderedDict from os import path from bs4 import BeautifulSoup from jinja2 import Environment, FileSystemLoader from jinja2.exceptions import TemplateNotFound from mistune import Renderer, Markdown from unidecode import unidecode __version__ = '0.2.0' # unicode magic reload(sys) sys.setdefaultencoding('utf-8') # Python dictionary that will contain the lp schedule. lps_dict = OrderedDict() # Python dictionary that will contain the lp speakers. lpspeakers_dict = OrderedDict() def read_file(filename): """Read file and return it as a string. filename: Absolute pathname of the file. """ content = '' try: with open(filename, 'rb') as f: for line in f: content = content + line except IOError: print "Error: unable to open %s" % filename return content class LPSRenderer(Renderer): """Helps in converting Markdown version of LP schedule to a dictionary. """ def __init__(self, **kwargs): super(LPSRenderer, self).__init__(**kwargs) self.last_day = None self.last_time_slot = None self.last_session = None # Denotes the no. of the paragraph under a session; this # information will be helpful in identifying the "speaker", # "room" and session "description". self.no_paragraph = None def header(self, text, level, raw=None): global lps_dict if level == 2: # Add new day. lps_dict[text] = OrderedDict() self.last_day = text elif level == 3: # Add new timeslot lps_dict[self.last_day][text] = OrderedDict() self.last_time_slot = text elif level == 4: # Add new session lps_dict[self.last_day][self.last_time_slot][text] = OrderedDict() self.last_session = text # We found a new session; set no of paragraphs processed # to 0. self.no_paragraph = 0 return super(LPSRenderer, self).header(text, level, raw) def paragraph(self, text): global lps_dict p = super(LPSRenderer, self).paragraph(text) if self.no_paragraph == 0: # Speaker speakers = text.split(', ') lps_dict[self.last_day][self.last_time_slot][ self.last_session]['speakers'] = speakers self.no_paragraph = self.no_paragraph + 1 elif self.no_paragraph == 1: # Room lps_dict[self.last_day][self.last_time_slot][ self.last_session]['room'] = text # Initialize description lps_dict[self.last_day][self.last_time_slot][ self.last_session]['desc'] = [] self.no_paragraph = self.no_paragraph + 1 elif self.no_paragraph > 1: lps_dict[self.last_day][self.last_time_slot][ self.last_session]['desc'].append(text) return p class LPSpeakersRenderer(Renderer): """Helps in converting Markdown version of LP speakers to a dictionary. """ def __init__(self, **kwargs): super(LPSpeakersRenderer, self).__init__(**kwargs) global lpspeakers_dict lpspeakers_dict = OrderedDict() lpspeakers_dict['keynote-speakers'] = [] lpspeakers_dict['speakers'] = [] # Type of present speaker being processed; can either be # 'keynote-speakers' or 'speakers'.' self.speaker_type = None # Maintain a list of used IDs self.used_ids = [] def mk_uid(self, text): """Returns a unique id. """ # 'John HÖcker, Onion Project' -> 'John HÖcker' text = text.split(', ')[0] # 'John HÖcker' -> 'John Hacker' ascii_text = unidecode(unicode(text)) # 'John Hacker' -> 'hacker' id_ = ascii_text.split()[-1].lower() if id_ not in self.used_ids: self.used_ids.append(id_) return id_ else: # 'John Hacker' -> 'john_hacker' id_ = '_'.join([s.lower() for s in ascii_text.split()]) self.used_ids.append(id_) return id_ def header(self, text, level, raw=None): global lpspeakers_dict if level == 1: self.speaker_type = 'keynote-speakers' lpspeakers_dict[self.speaker_type].append(OrderedDict()) lpspeakers_dict[self.speaker_type][-1]['speaker'] = text lpspeakers_dict[self.speaker_type][-1]['id'] = self.mk_uid(text) lpspeakers_dict[self.speaker_type][-1]['bio'] = [] elif level == 2: self.speaker_type = 'speakers' lpspeakers_dict[self.speaker_type].append(OrderedDict()) lpspeakers_dict[self.speaker_type][-1]['speaker'] = text.split(', ')[0] lpspeakers_dict[self.speaker_type][-1]['id'] = self.mk_uid(text) lpspeakers_dict[self.speaker_type][-1]['bio'] = [] return super(LPSpeakersRenderer, self).header(text, level, raw) def image(self, src, title, text): global lpspeakers_dict lpspeakers_dict[self.speaker_type][-1]['img_url'] = src lpspeakers_dict[self.speaker_type][-1]['img_alt'] = text return super(LPSpeakersRenderer, self).image(src, title, text) def paragraph(self, text): global lpspeakers_dict p = super(LPSpeakersRenderer, self).paragraph(text) if text.startswith('