pzimediadesign/mmdc_pages.py

#! /usr/bin/env python
# -*- coding: utf-8 -*-

##############
# FROM THE JSON DICTIONARY CREATE AN INDEX PAGE
#####
import xml.etree.ElementTree as ET
import html5lib, urllib2, json, pprint, re
from mmdc_modules import api_thumb_url, pandoc2html, img_fullurl, api_file_url,  write_html_file
#import mmdc_create_json import api_thumb_url
# Load the all-works dictionary from disk (the file is only read here).
# The context manager closes the handle as soon as the JSON is parsed;
# json_allworks_file stays bound to the (now closed) file object.
with open('allworks_mmdc.json', 'r') as json_allworks_file:
    json_allworks = json.load(json_allworks_file)
# Target directory name; not referenced by the rest of the visible code.
pages_path = 'web/work'

#def generate_xml():
# Patterns for the MediaWiki markup embedded in the work texts.
# Raw string literals are used so that backslashes reach the regex engine
# untouched; sequences such as '\/' or '\{' are invalid escapes in a normal
# string literal and trigger warnings on newer interpreters.
# NOTE(review): none of these use re.DOTALL, so '.' stops at a newline and a
# <gallery> block or {{template}} spanning several lines is not matched --
# confirm the input texts are single-line.

# A whole <gallery>...</gallery> block (shortest match).
gallery_exp = re.compile(r'<gallery>.*?</gallery>')
# Anything following 'File:' up to the next 'File:' or the closing tag.
file_exp = re.compile(r'File:(.*?)(?=File:|<\/gallery>)')
# An image entry: group 1 is the 'File:'/'Image:' prefix, group 2 the file
# name with extension, group 3 the base name, group 4 the extension.
# The entry must be followed by '|', another entry or the closing tag.
img_exp = re.compile(
    r'(File:|Image:)((.*?)\.(gif|jpg|jpeg|png))(?=\||File:|Image:|<\/gallery>)',
    re.I)
# A two-part template {{first|second}}; used for {{provider|video id}}.
video_exp = re.compile(r'\{\{(.*?)\|(.*?)\}\}')

def replace_gallery(content):
    """Strip <gallery> blocks from *content* and collect their images.

    Every match of gallery_exp is removed from the text. Each image entry
    found inside a removed block (img_exp, group 2 = file name) is passed to
    api_file_url, and the result becomes the ``src`` of a new ``img`` element.

    Returns a tuple ``(text_without_galleries, list_of_img_elements)``; the
    list is empty when no gallery or no image entry is present.
    """
    # Capture the blocks first, then cut them out of the text.
    gallery_blocks = gallery_exp.findall(content)
    stripped = gallery_exp.sub('', content)

    # There may be more than one <gallery>; keep document order throughout.
    img_elements = [
        ET.Element('img', attrib={'src': api_file_url(entry[1])})
        for block in gallery_blocks
        for entry in img_exp.findall(block)
    ]
    return stripped, img_elements

def replace_video(content):
    """Strip {{provider|id}} templates from *content* and build video iframes.

    Every match of video_exp is removed from the text, whatever its provider.
    For the providers 'youtube' and 'vimeo' (case-insensitive, surrounding
    whitespace ignored) an ``iframe`` element pointing at the provider's
    embed URL is created; templates with any other first part are dropped
    without producing an element.

    Returns a tuple ``(text_without_templates, list_of_iframe_elements)``.
    """
    embed_prefixes = {
        'youtube': 'https://www.youtube.com/embed/',
        'vimeo': 'https://player.vimeo.com/video/',
    }
    videos = []
    for provider, video_hash in video_exp.findall(content):
        # The captured groups are used as they are: wrapping them in str()
        # forces an ASCII encode of unicode text on Python 2 and raises
        # UnicodeEncodeError for any template containing non-ASCII characters.
        prefix = embed_prefixes.get(provider.strip().lower())
        if prefix is None:
            continue  # not a supported video provider
        iframe_el = ET.Element('iframe', attrib={
            # Whitespace around the id would yield a broken embed URL.
            'src': prefix + video_hash.strip(),
            'width': '600px',
            'height': '450px',
        })
        videos.append(iframe_el)
    content = video_exp.sub('', content)
    return content, videos
    
def create_workpage(allworks_dict, work_key, tree):
    """Replace the text values of one work with HTML nodes and fill the page.

    allworks_dict -- field name -> text for a single work; modified in place:
                     every value is replaced by an element (or None for
                     fields that are not handled), 'Images' / 'Video' lists
                     are added when galleries / video templates are found,
                     and 'Thumbnail_url' is removed.
    work_key      -- identifier of the work; not used by this function.
    tree          -- parsed page template; must contain a
                     ``div`` with ``class="body"`` (IndexError otherwise).

    Only the converted 'Description' and 'Extra' texts are appended to the
    tree (into the body div). The elements built for the other fields are
    stored in the dictionary but not attached to the tree here.
    Prints debugging output and returns None.
    """
    # Only the body container receives content, so resolve it once up front
    # rather than on every key.
    div_body = tree.findall(".//div[@class='body']")[0]

    # Shared accumulators, so that media found in 'Extra' do not overwrite
    # media already collected from 'Description' (and vice versa).
    all_gallery_imgs = []
    all_videos = []

    # Iterate over a snapshot of the keys: 'Images' and 'Video' may be added
    # to the dictionary while looping.
    for key in list(allworks_dict.keys()):
        if key in ('Description', 'Extra'):
            mw_content = allworks_dict[key]
            if gallery_exp.search(mw_content):
                mw_content, gallery_imgs = replace_gallery(mw_content)
                all_gallery_imgs.extend(gallery_imgs)
                allworks_dict['Images'] = all_gallery_imgs
            # Checked independently of the gallery test: a text may contain
            # both a gallery and video templates.
            if video_exp.search(mw_content):
                mw_content, videos = replace_video(mw_content)
                all_videos.extend(videos)
                allworks_dict['Video'] = all_videos

            allworks_dict[key] = pandoc2html(mw_content)  # convert to HTML
            work_el = html5lib.parseFragment(allworks_dict[key],
                                             namespaceHTMLElements=False)
            div_body.append(work_el)

            print("****************************")
            print(ET.tostring(div_body))
            print("****************************")
        elif key == 'Website':
            work_el = ET.Element('a', attrib={'href': allworks_dict[key], 'id': key})
            work_el.text = 'LINK'
        elif key == 'Title':
            work_el = ET.Element('h1', attrib={'id': key})
            work_el.text = allworks_dict[key]
            # NOTE: the heading is not attached to the header div. The
            # original author recorded that appending it raised
            # "TypeError: must be Element, not Element" -- presumably the
            # template tree uses a different ElementTree implementation
            # than ET; TODO confirm.
        elif key in ('Creator', 'Date', 'Bio'):
            work_el = ET.Element('p', attrib={'id': key})
            work_el.text = allworks_dict[key]
        elif key == 'Thumbnail':
            work_el = ET.Element('img', attrib={'src': allworks_dict[key], 'id': key})
            print(ET.tostring(work_el))
        else:
            work_el = None  # unhandled field; the key is kept with value None
        allworks_dict[key] = work_el

    allworks_dict.pop('Thumbnail_url', None)  # never part of the page data
    pprint.pprint(allworks_dict)

            
def edit_index(filepath, json_allworks_dict):
    """Parse the index page at *filepath* and insert every work into it.

    filepath           -- path of the HTML index file to parse.
    json_allworks_dict -- work key -> work dictionary.

    Each work is handed to insert_work together with the
    ``div`` whose ``id`` is ``section02`` (IndexError if the page has no
    such div). Returns the parsed tree; nothing is written back to disk here.
    """
    # The whole document is parsed before the handle is released.
    with open(filepath, 'r') as input_file:
        tree = html5lib.parse(input_file, namespaceHTMLElements=False)
    div_section02 = tree.findall(".//div[@id='section02']")[0]
    # NOTE(review): insert_work is neither defined nor imported in the
    # visible part of this file; calling this function raises NameError
    # unless it is provided elsewhere -- confirm.
    for key in list(json_allworks_dict.keys()):
        graduation_work = json_allworks_dict[key]
        insert_work(div_section02, 'Graduation_work thumbnail', graduation_work, key)
    return tree


# Generate one HTML page per graduation work from the shared template.
# The template is read once and its handle closed. Every work then gets a
# fresh tree parsed from the in-memory markup, so the loop no longer depends
# on the parser rewinding a shared, already-consumed file object.
with open('web/work.html', 'r') as worktemplate:
    worktemplate_html = worktemplate.read()

for key in json_allworks.keys():
    graduation_work = json_allworks[key]
    # Non-ASCII characters are dropped from the title used in the file name.
    # The title must be read before create_workpage replaces it by an element.
    graduation_work_title = graduation_work['Title'].encode('ascii', 'ignore')
    work_file = 'web/' + key + '-' + graduation_work_title + '.html'
    work_tree = html5lib.parse(worktemplate_html, namespaceHTMLElements=False)
    create_workpage(graduation_work, key, work_tree)
    write_html_file(work_tree, work_file)
    print('----------')
    # create_workpage has replaced the 'Creator' text by an element by now,
    # so this prints the element object, not the creator's name.
    print(graduation_work['Creator'])
    print(graduation_work_title)
    print('----------')
mmdc_pages.py pandoc conversion working 9 years ago			`#! /usr/bin/env python`
			`# -*- coding: utf-8 -*-`

			`##############`
			`# FROM THE JSON DICTIONARY CREATE AN INDEX PAGE`
			`#####`
			`import xml.etree.ElementTree as ET`
			`import html5lib, urllib2, json, pprint, re`
creating work page 9 years ago			`from mmdc_modules import api_thumb_url, pandoc2html, img_fullurl, api_file_url, write_html_file`
creating pages makeing script 9 years ago			`#import mmdc_create_json import api_thumb_url`
mmdc_pages.py pandoc conversion working 9 years ago			`json_allworks_file = open('allworks_mmdc.json', 'r') # save json`
			`json_allworks = json.loads(json_allworks_file.read())`
			`pages_path = 'web/work'`

creating pages makeing script 9 years ago			`#def generate_xml():`
quick n dirty gallery replacement 9 years ago			`gallery_exp=re.compile('<gallery>.*?</gallery>')`
			`file_exp=re.compile('File:(.*?)(?=File:|<\/gallery>)')`
video to iframes 9 years ago			`img_exp=re.compile('(File:|Image:)((.*?)\.(gif|jpg|jpeg|png))(?=\||File:|Image:|<\/gallery>)', re.I)`
			`video_exp=re.compile('\{\{(.*?)\|(.*?)\}\}')`
quick n dirty gallery replacement 9 years ago
			`def replace_gallery(content):`
			`# from <gallery>.*</gallery> imgs, return list of img ET elements`
			`# replace <gallery>.*</gallery> with ''`
			`gallery_imgs = []`
			`gallery_found = re.findall(gallery_exp, content)`
			`content = re.sub(gallery_exp, '', content)`
			`for gallery in gallery_found: # in case there is more than 1 <gallery>`
refined gallery regex 9 years ago			`allfiles =re.findall(img_exp, gallery)`
quick n dirty gallery replacement 9 years ago			`for imgfile in allfiles:`
video to iframes 9 years ago			`imgfile = imgfile[1]`
			`imgsrc = api_file_url(imgfile) # search for original image`
quick n dirty gallery replacement 9 years ago			`img_el = ET.Element('img', attrib={'src': imgsrc})`
			`gallery_imgs.append(img_el)`
			`return content, gallery_imgs`
video to iframes 9 years ago
			`def replace_video(content):`
			`videos = []`
			`videos_found = re.findall(video_exp, content)`
			`for video in videos_found:`
			`video_provider = str(video[0])`
			`video_hash = str(video[1])`
			`video_src = None`
			`if (video_provider.lower()) == 'youtube':`
			`video_src="https://www.youtube.com/embed/" + video_hash`
			`elif (video_provider.lower()) == 'vimeo':`
			`video_src="https://player.vimeo.com/video/" + video_hash`
			`if video_src:`
			`iframe_el = ET.Element('iframe', attrib={'src':video_src, 'width':'600px', 'height':'450px'})`
			`videos.append(iframe_el)`
			`content = re.sub(video_exp, '', content)`
			`return content, videos`
creating pages makeing script 9 years ago
creating work page 9 years ago			`def create_workpage( allworks_dict, work_key, tree): # replace text content in dict with html nodes, holding the content`
creating pages makeing script 9 years ago			`for key in allworks_dict.keys():`
creating work page 9 years ago			`div_header = (tree.findall(".//div[@class='header']"))[0]`
			`div_body = (tree.findall(".//div[@class='body']"))[0]`
			`div_av = (tree.findall(".//div[@class='av']"))[0]`

quick n dirty gallery replacement 9 years ago			`if key in ['Description', 'Extra']:`
			`mw_content = allworks_dict[key]`
			`if re.search(gallery_exp, mw_content):`
			`mw_content, gallery_imgs = replace_gallery(mw_content)`
video to iframes 9 years ago			`allworks_dict['Images'] = gallery_imgs`
			`elif re.search(video_exp, mw_content):`
			`mw_content, videos = replace_video(mw_content)`
			`allworks_dict['Video'] = videos`
creating work page 9 years ago
quick n dirty gallery replacement 9 years ago			`allworks_dict[key] = pandoc2html( mw_content if key in allworks_dict.keys() else '' ) # convert to HTML`
creating work page 9 years ago			`work_el = html5lib.parseFragment(allworks_dict[key], namespaceHTMLElements=False)`
quick n dirty gallery replacement 9 years ago
creating work page 9 years ago			`div_body.append( work_el )`
quick n dirty gallery replacement 9 years ago
creating work page 9 years ago			`print "****************************"`
			`print ET.tostring(div_body)`
			`print "****************************"`
creating pages makeing script 9 years ago			`elif key in ['Website']:`
creating work page 9 years ago			`work_el = ET.Element('a', attrib={'href': allworks_dict[key], 'id':key})`
			`work_el.text = 'LINK'#allworks_dict[key]`
creating pages makeing script 9 years ago			`elif key in ['Title']:`
creating work page 9 years ago			`work_el = ET.Element('h1', attrib={'id': key})`
			`work_el.text = allworks_dict[key]`

			`# typeerror: must be Element, not Element`
			`# div_header.append(work_el)`



creating pages makeing script 9 years ago			`elif key in ['Creator', 'Date', 'Bio']:`
creating work page 9 years ago			`work_el = ET.Element('p', attrib={'id': key})`
			`work_el.text = allworks_dict[key]`
			`elif key in ['Thumbnail']:`
			`work_el = ET.Element('img', attrib={'src': allworks_dict[key], 'id': key})`
			`print ET.tostring(work_el)`
creating pages makeing script 9 years ago			`else:`
creating work page 9 years ago			`work_el = None # remove keys with None value?`
			`allworks_dict[key] = work_el`
			`allworks_dict.pop('Thumbnail_url', None) #remove Thumbnail_url`
video to iframes 9 years ago			`pprint.pprint(allworks_dict)`
creating pages makeing script 9 years ago

creating work page 9 years ago			`def edit_index(filepath, json_allworks_dict):`
			`input_file = open(filepath, 'r')`
			`tree = html5lib.parse(input_file, namespaceHTMLElements=False)`
			`div_section02 = (tree.findall(".//div[@id='section02']"))[0]`
			`for key in json_allworks_dict.keys():`
			`graduation_work=json_allworks_dict[key]`
			`insert_work(div_section02, 'Graduation_work thumbnail', graduation_work, key )`
			`return tree`
creating pages makeing script 9 years ago

creating work page 9 years ago			`worktemplate = open('web/work.html', 'r')`
			`for key in json_allworks.keys():`
			`graduation_work=json_allworks[key]`
			`graduation_work_title = (json_allworks[key]['Title']).encode('ascii', 'ignore')`
			`work_file = 'web/' + key + '-' + graduation_work_title + '.html'`
			`work_tree = html5lib.parse(worktemplate, namespaceHTMLElements=False)`
			`create_workpage(graduation_work, key, work_tree )`
			`write_html_file(work_tree, work_file)`
			`print '----------'`
			`# print ET.tostring(work_tree)`
			`print graduation_work['Creator']`
			`print graduation_work_title`

creating pages makeing script 9 years ago			`print '----------'`