SiteGenerator/gsitegen/generate.py

from html5tagger import Document, E, HTML
import shutil
import markdown
import html
from pathlib import Path

def parseLink(link, pagetitle, homepage):
  """Translate a navbar link target into the href used in the generated HTML.

  link: raw target text, either a local "<Title>.page" reference or any other
    link; surrounding whitespace (including the newline left by readlines)
    is ignored.
  pagetitle: title of the page currently being generated.
  homepage: title of the page that is served from the site root.

  Returns "#" when the link points at the current page, "/" when it points at
  the homepage, "/<slug>" for any other ".page" link and the bare slug for
  everything else. The slug is the link lowercased, with spaces replaced by
  dashes and ".page" removed.
  """
  #strip once up front, otherwise leading whitespace would turn into a dash
  #and a trailing newline would end up inside the href
  target = link.strip()

  if target == pagetitle + ".page":
    return "#"
  if target == homepage + ".page":
    return "/"

  destination = target.replace(" ", "-").replace(".page", "").lower()

  #Start local links with / symbol
  if target.endswith(".page"):
    return "/" + destination
  return destination

def _navbarAnchor(href, title):
  """Return the anchor markup for one navbar entry.

  Entries whose href is "#" (the page currently being generated) are wrapped
  in a div with class 'active'.
  """
  anchor = "<a href='" + href + "'>" + title + "</a>"
  if href == "#":
    return "<div class='active'>" + anchor + "</div>"
  return anchor


def _closeDropdown(bar, dropdownhtml):
  """Terminate the dropdown markup and append it to the bar as one list item."""
  dropdownhtml = dropdownhtml(HTML("</div></div>"))
  return bar.li(dropdownhtml)


def generateNavigationBar(lines, pagetitle):
  """Build the navigation bar entries for the page titled `pagetitle`.

  lines: lines of the 'navbar' file. Each entry has the form "title;link".
    An entry ending in "|" opens a dropdown, and the following entries that
    are indented by two spaces are placed inside it. A line consisting of
    ">" starts a raw HTML block (handled by parseRawHTML).
  pagetitle: title of the page being generated; a link that resolves to this
    page is marked with class 'active'.

  Returns the html5tagger builder holding the list items; the same object is
  also stored in the module global `navbar`. Reads the module global
  `homepage`.

  Raises SystemExit with status 1, after printing the offending line, when a
  line outside a raw HTML block contains no ";".
  """
  global navbar
  navbar = E
  rawhtml = False
  htmlstring = ""
  dropdown = False
  dphtml = E
  total = len(lines)

  for index, line in enumerate(lines):

    #parse raw HTML
    rawhtml, navbar, htmlstring = parseRawHTML(navbar, line, htmlstring, rawhtml, index, total)
    if rawhtml:
      continue

    #parse navigation bar (custom format)
    if ";" not in line:
      print("Error: invalid navbar entry, line " + str(index + 1) + " content: " + line)
      #a failed build must not report success to the calling shell
      raise SystemExit(1)

    title, link = line.split(";", 1)
    isheader = line.strip().endswith("|")
    ischild = dropdown and not isheader and line.startswith("  ")
    nextindented = index + 1 < total and lines[index + 1].startswith("  ")

    #a dropdown that is still open but cannot take this line is finished first,
    #so it is neither dropped nor picked up again by a later indented line
    if dropdown and not ischild:
      navbar = _closeDropdown(navbar, dphtml)
      dropdown = False

    if isheader:
      #drop the trailing "|" marker before resolving the link
      link = link.strip()[:-1]
      href = parseLink(link, pagetitle, homepage).strip()

      #the dropdown button itself acts like a normal clickable navbar entry
      dphtml = E(HTML("<div class='dropdown'><div class='dropbutton'>" + _navbarAnchor(href, title) + "</div><div class='dropdown-content'>"))
      dropdown = True
    elif ischild:
      href = parseLink(link, pagetitle, homepage).strip()
      dphtml = dphtml(HTML(_navbarAnchor(href, title)))
    else:
      href = parseLink(link, pagetitle, homepage).strip()
      navbar = navbar.li(HTML(_navbarAnchor(href, title)))
      continue

    #handle end of indentation (this was the last line or next line is not indented);
    #this also closes a dropdown header that has no entries at all
    if not nextindented:
      navbar = _closeDropdown(navbar, dphtml)
      dropdown = False

  #a raw HTML block that runs to the end of the file can leave a dropdown open
  if dropdown:
    navbar = _closeDropdown(navbar, dphtml)
  return navbar

def generateFooter(lines):
  """Build the footer entries from the lines of the 'footer' file.

  Every line is first offered to parseRawHTML; lines that are not part of a
  raw HTML block are rendered with parseMarkdown and appended as a list item.
  Nothing is returned: the resulting builder is stored in the module global
  `footer`.
  """
  global footer
  footer = E
  inraw = False
  pending = ""
  total = len(lines)

  for position, text in enumerate(lines):
    #raw HTML handling comes first, it decides whether this line is markdown at all
    inraw, footer, pending = parseRawHTML(footer, text, pending, inraw, position, total)
    if inraw:
      continue

    #everything outside a raw HTML block is markdown
    rendered = parseMarkdown(footer, text)
    footer = footer.li(HTML(rendered))

def parseRawHTML(doc, line, htmlstring, rawhtml, id, maxlines):
  """Feed one line to the raw HTML block parser.

  A line consisting only of ">" opens a raw HTML block. The following lines
  that start with two spaces are collected into the block; the first line
  that does not start with two spaces (or the end of the file) closes it and
  the collected HTML is appended to `doc` inside a div.

  doc: html5tagger builder (or the bare `E` factory) to append to.
  line: the current line.
  htmlstring: HTML collected so far for the open block.
  rawhtml: True while a raw HTML block is open.
  id: zero-based index of `line`.
  maxlines: total number of lines, used to detect the last line.

  Returns the updated (rawhtml, doc, htmlstring) tuple. Callers must keep
  using the returned `doc`.
  """

  #raw html start
  if line.strip() == ">":
    #a new block starting while one is still open: emit the open one first
    #instead of silently discarding what was collected
    if rawhtml and htmlstring:
      doc = doc.div(HTML(htmlstring))
    rawhtml = True
    htmlstring = ""

  #parse indented raw html
  elif rawhtml:
    if line.startswith("  "):

      #experimental markdown inside HTML support
      htmlstring = htmlstring + html.unescape(markdown.markdown(html.escape(line.strip())))

      #if indented html was the last line, this is needed for it to not be ignored
      #since this is the end of the file, we will not set rawhtml to False.
      if maxlines - id == 1:
        #keep the result: when doc is still the bare E factory, .div() builds
        #a new snippet rather than modifying doc in place
        doc = doc.div(HTML(htmlstring))
    else:
      rawhtml = False
      doc = doc.div(HTML(htmlstring))
      htmlstring = ""

  return rawhtml, doc, htmlstring

def parseMarkdown(doc, line):
  """Render one line of markdown to HTML.

  The line is stripped and HTML-escaped before rendering, so HTML typed into
  a markdown line is shown as text instead of being interpreted.
  `doc` is accepted but not used.
  """
  #do not allow HTML in markdown
  return markdown.markdown(html.escape(line.strip()))

def generateLines(title, lines):
  """Turn the lines of one .page file into a document and register it.

  title: page title; any ".page" in it is removed.
  lines: content lines of the page.

  Lines inside raw HTML blocks are handled by parseRawHTML, all other lines
  are rendered with parseMarkdown. The finished document is handed to
  generatePage.
  """
  pagename = title.replace(".page", "")
  page = Document(pagename, lang="en")
  inraw = False
  pending = ""
  total = len(lines)

  for position, text in enumerate(lines):
    #raw HTML handling comes first, it decides whether this line is markdown at all
    inraw, page, pending = parseRawHTML(page, text, pending, inraw, position, total)
    if inraw:
      continue

    #everything outside a raw HTML block is markdown
    rendered = parseMarkdown(page, text)
    page = page(HTML(rendered))

  generatePage(pagename, page)

def generatePage(title, doc):
  """Assemble the final HTML of one page and remember it for writePages.

  title: page title, appended to the module global list `titles`.
  doc: page body; its string form is placed between navbar and footer.

  The navigation bar is generated from the 'navbar' file next to this script
  when that file exists. The footer is added when the module global `footer`
  exists. The assembled HTML is appended to the module global list `pages`.
  """
  #the result lists are created on first use
  globals().setdefault('pages', [])
  globals().setdefault('titles', [])

  navsource = Path(__file__).parent.joinpath('navbar')

  if not navsource.exists():
    print("No 'navbar' file found, there will be no navigation bar.")
    markup = str(doc)
  else:
    with navsource.open('r') as handle:
      navitems = generateNavigationBar(handle.readlines(), title)
    markup = str(E.ul(navitems)) + str(doc)

  #footer is optional, it only exists when a 'footer' file was processed
  if 'footer' in globals():
    markup = markup + str(E.ul(footer))

  pages.append(markup)
  titles.append(title)

def writePages():
  """Write all generated pages and copy the resources into 'website-output'.

  Every page is written to website-output/<slug>/index.html, where the slug
  is the title lowercased with spaces replaced by dashes; the page whose
  title equals the module global `homepage` goes to website-output/index.html.
  A page whose file already has identical content is left untouched.

  If a 'resources' folder exists next to this script it is copied into the
  output folder, and every top-level folder in the output is renamed to the
  same slug format, merging into an already existing folder of that name.
  """
  #when no .page file was found generatePage never ran and these globals do not exist
  state = globals()
  allpages = state.get("pages", [])
  alltitles = state.get("titles", [])

  #TODO only delete files that aren't present in newest site generation

  #needed by the resources step too, so it must not depend on the loop running
  outputpath = Path(__file__).parent.joinpath("website-output")

  for title, page in zip(alltitles, allpages):
    foldername = ""

    #creates ./website-output/pagetitle/index.html file if it is not homepage
    if title != homepage:
      foldername = title.replace(" ", "-").lower()

    dirpath = outputpath.joinpath(foldername)
    dirpath.mkdir(parents=True, exist_ok=True)

    filepath = dirpath.joinpath("index.html")

    if filepath.exists():
      with filepath.open('r') as oldpage:
        if oldpage.read() == page:
          print("Page not changed: " + title)
          continue

    with filepath.open('w') as newpage:
      newpage.write(page)
      print("Written changed page: " + title)

  #resources
  respath = Path(__file__).parent.joinpath("resources")
  if not respath.exists():
    return

  #shutil.copytree copies timestamp too
  shutil.copytree(respath, outputpath, dirs_exist_ok=True)

  #check if folders are named correctly
  #(snapshot the listing, folders are renamed and removed while looping)
  for folder in list(outputpath.iterdir()):
    if not folder.is_dir():
      continue

    #rename folder name format from "About Page" to "about-page"
    bettername = folder.name.replace(" ", "-").lower()
    if folder.name == bettername:
      continue

    newpath = outputpath.joinpath(bettername)

    #example: resources folder is "About", page got auto-created earlier as "about" (from About.page), let's copy "About" resources to "about" and delete "About"
    #on a case-insensitive filesystem both names can be the very same folder,
    #which must be renamed instead of copied onto itself and deleted
    if newpath.exists() and not newpath.samefile(folder):
      shutil.copytree(folder, newpath, dirs_exist_ok=True)
      shutil.rmtree(folder)
    else:
      shutil.move(str(folder), str(newpath))

def main():
  """Generate the whole site from the files next to this script.

  Sets the module global `homepage`, builds the footer from the 'footer' file
  when it exists, generates a page for every file with the ".page" suffix and
  finally writes everything out with writePages.
  """

  #if homepage is at Home.page, set homepage to "Home"
  global homepage
  homepage = "Home"

  basedir = Path(__file__).parent

  footerpath = basedir.joinpath('footer')
  if not footerpath.exists():
    print("No 'footer' file found, there will be no footer.")
  else:
    with footerpath.open('r') as handle:
      generateFooter(handle.readlines())

  pagescount = 0
  for entry in basedir.iterdir():
    #only regular files with the .page suffix are pages
    if not entry.is_file() or entry.suffix != ".page":
      continue
    pagescount += 1
    with entry.open('r') as handle:
      generateLines(entry.stem, handle.readlines())
  print("Found " + str(pagescount) + " pages")

  #write all pages to files
  writePages()

#run the generator only when this file is executed as a script, not when it is imported
if __name__ == "__main__":
  main()
Start using html5tagger better 2022-01-22 09:26:09 +00:00			`from html5tagger import Document, E, HTML`
More flexible resources implementation 2022-02-01 16:36:30 +00:00			`import shutil`
Basic markdown and raw HTML support 2022-01-24 10:09:04 +00:00			`import markdown`
escape HTML in markdown, more functions 2022-01-24 12:43:28 +00:00			`import html`
Only change edited pages, W.I.P 2022-01-26 10:03:25 +00:00			`from pathlib import Path`
Initial commit 2022-01-21 10:16:26 +00:00
Finish dropdown in navbar 2022-02-07 12:18:31 +00:00			`def parseLink(link, pagetitle, homepage):`
			`if link.strip() == pagetitle + ".page":`
			`return "#"`
			`elif link.strip() == homepage + ".page":`
			`return "/"`
			`else:`
			`destination = link.replace(" ", "-").replace(".page", "").lower()`

			`#Start local links with / symbol`
			`if link.strip().endswith(".page"):`
			`return "/" + destination`
			`return destination`

Better navbar styling support 2022-02-03 13:34:15 +00:00			`def generateNavigationBar(lines, pagetitle):`
Progress on making code cleaner 2022-01-22 09:54:31 +00:00			`global navbar`
			`navbar = E`
Unfinished navigation bar remake 2022-01-25 14:05:07 +00:00			`rawhtml = False`
			`htmlstring = ""`
Improve navbar, unfinished dropdown support 2022-02-04 17:29:07 +00:00			`dropdown = False`
Better parseRawHTML function 2022-01-24 13:20:08 +00:00			`for id, line in enumerate(lines):`
Fix line after raw html not working 2022-01-24 10:35:29 +00:00
Unfinished navigation bar remake 2022-01-25 14:05:07 +00:00			`#parse raw HTML`
			`rawhtml, navbar, htmlstring = parseRawHTML(navbar, line, htmlstring, rawhtml, id, len(lines))`

Better navbar styling support 2022-02-03 13:34:15 +00:00			`#parse navigation bar (custom format)`
Unfinished navigation bar remake 2022-01-25 14:05:07 +00:00			`if not rawhtml:`
Experimental styling support for navigation bar 2022-02-02 14:51:46 +00:00			`if ";" in line:`
			`title, link = line.split(";", 1)`

Improve navbar, unfinished dropdown support 2022-02-04 17:29:07 +00:00			`if line.strip().endswith("\|"):`
			`dropdown = True`
Finish dropdown in navbar 2022-02-07 12:18:31 +00:00			`link = link.strip()[:len(link.strip())-1]`
Improve navbar, unfinished dropdown support 2022-02-04 17:29:07 +00:00			`dphtml = E`
Finish dropdown in navbar 2022-02-07 12:18:31 +00:00
			`#some duplicate logic as normal navbar entries get, to make dropdown button in itself act like a normal clickable navbar entry`
			`link = parseLink(link, pagetitle, homepage)`
			`if link.strip() == "#":`
			`dphtml = dphtml(HTML("<div class='dropdown'><div class='dropbutton'><div class='active'><a href='" + link.strip() + "'>" + title + "</a></div></div><div class='dropdown-content'>"))`
			`else:`
			`dphtml = dphtml(HTML("<div class='dropdown'><div class='dropbutton'><a href='" + link.strip() + "'>" + title + "</a></div><div class='dropdown-content'>"))`
			`continue`

Improve navbar, unfinished dropdown support 2022-02-04 17:29:07 +00:00			`elif dropdown:`
			`if line.startswith(" "):`
Finish dropdown in navbar 2022-02-07 12:18:31 +00:00
			`link = parseLink(link, pagetitle, homepage)`
			`if link.strip() == "#":`
			`dphtml = dphtml(HTML("<div class='active'><a href='" + link.strip() + "'>" + title + "</a></div>"))`
			`else:`
			`dphtml = dphtml(HTML("<a href='" + link.strip() + "'>" + title + "</a>"))`

			`#handle end of indentation (if indented line is the last line of page or next line is not indented)`
			`if len(lines) - id == 1 or lines[id + 1].startswith(" ") is False:`
			`dphtml = dphtml(HTML("</div></div>"))`
			`navbar = navbar.li(dphtml)`
			`dropdown = False`
Improve navbar, unfinished dropdown support 2022-02-04 17:29:07 +00:00			`continue`
Finish dropdown in navbar 2022-02-07 12:18:31 +00:00
Better navbar styling support 2022-02-03 13:34:15 +00:00			`#mark currently open tab as active when it is open`
Finish dropdown in navbar 2022-02-07 12:18:31 +00:00			`link = parseLink(link, pagetitle, homepage)`
			`if link.strip() == "#":`
Improve navbar, unfinished dropdown support 2022-02-04 17:29:07 +00:00			`navbar = navbar.li(HTML("<div class='active'>" + "<a href='" + link.strip() + "'>" + title + "</a></div>"))`
Finish dropdown in navbar 2022-02-07 12:18:31 +00:00			`continue`

			`navbar = navbar.li(HTML("<a href='" + link.strip() + "'>" + title + "</a>"))`
Bugfixes to navbar styling 2022-02-03 14:35:28 +00:00			`else:`
			`print("Error: invalid navbar entry, line " + str(id + 1) + " content: " + line)`
			`exit()`
Better navbar styling support 2022-02-03 13:34:15 +00:00			`return navbar`
Finish dropdown in navbar 2022-02-07 12:18:31 +00:00
Experimental footer, identical to navbar 2022-01-31 10:11:51 +00:00			`def generateFooter(lines):`
			`global footer`
			`footer = E`
			`rawhtml = False`
			`htmlstring = ""`
			`for id, line in enumerate(lines):`

			`#parse raw HTML`
			`rawhtml, footer, htmlstring = parseRawHTML(footer, line, htmlstring, rawhtml, id, len(lines))`

			`#parse markdown`
			`if not rawhtml:`
			`footer = footer.li(HTML(parseMarkdown(footer, line)))`

Better parseRawHTML function 2022-01-24 13:20:08 +00:00			`def parseRawHTML(doc, line, htmlstring, rawhtml, id, maxlines):`
More code cleanup 2022-01-26 10:36:59 +00:00
escape HTML in markdown, more functions 2022-01-24 12:43:28 +00:00			`#raw html start`
			`if line.strip() == ">":`
			`rawhtml = True`
			`htmlstring = ""`

			`#parse indented raw html`
			`elif rawhtml:`
			`if line.startswith(" "):`
Experimental Markdown inside HTML support 2022-01-24 14:23:07 +00:00
			`#experimental markdown inside HTML support`
			`htmlstring = htmlstring + html.unescape(markdown.markdown(html.escape(line.strip())))`
Better parseRawHTML function 2022-01-24 13:20:08 +00:00
			`#if indented html was the last line, this is needed for it to not be ignored`
Small improvement 2022-01-24 14:06:16 +00:00			`#since this is the end of the file, we will not set rawhtml to False.`
Better parseRawHTML function 2022-01-24 13:20:08 +00:00			`if maxlines - id == 1:`
			`doc.div(HTML(htmlstring))`
escape HTML in markdown, more functions 2022-01-24 12:43:28 +00:00			`else:`
			`rawhtml = False`
Better parseRawHTML function 2022-01-24 13:20:08 +00:00			`doc.div(HTML(htmlstring))`
escape HTML in markdown, more functions 2022-01-24 12:43:28 +00:00			`htmlstring = ""`
Experimental styling support for navigation bar 2022-02-02 14:51:46 +00:00
escape HTML in markdown, more functions 2022-01-24 12:43:28 +00:00			`return rawhtml, doc, htmlstring`

			`def parseMarkdown(doc, line):`
More code cleanup 2022-01-26 10:36:59 +00:00
Only change edited pages, W.I.P 2022-01-26 10:03:25 +00:00			`#do not allow HTML in markdown`
escape HTML in markdown, more functions 2022-01-24 12:43:28 +00:00			`line = html.escape(line.strip())`
Further navigation improvements, start of remaking compiling process 2022-01-25 14:45:27 +00:00			`return markdown.markdown(line)`
escape HTML in markdown, more functions 2022-01-24 12:43:28 +00:00
Functions 2022-01-22 14:06:25 +00:00			`def generateLines(title, lines):`
			`title = title.replace(".page", "")`
Cleanup document, remove unnecessary join 2022-01-24 10:25:29 +00:00			`doc = Document(title, lang="en")`
Basic markdown and raw HTML support 2022-01-24 10:09:04 +00:00			`rawhtml = False`
escape HTML in markdown, more functions 2022-01-24 12:43:28 +00:00			`htmlstring = ""`
Better parseRawHTML function 2022-01-24 13:20:08 +00:00			`for id, line in enumerate(lines):`
Basic markdown and raw HTML support 2022-01-24 10:09:04 +00:00
escape HTML in markdown, more functions 2022-01-24 12:43:28 +00:00			`#parse raw HTML`
Better parseRawHTML function 2022-01-24 13:20:08 +00:00			`rawhtml, doc, htmlstring = parseRawHTML(doc, line, htmlstring, rawhtml, id, len(lines))`
Basic markdown and raw HTML support 2022-01-24 10:09:04 +00:00
			`#parse markdown`
escape HTML in markdown, more functions 2022-01-24 12:43:28 +00:00			`if not rawhtml:`
Further navigation improvements, start of remaking compiling process 2022-01-25 14:45:27 +00:00			`doc = doc(HTML(parseMarkdown(doc, line)))`
Basic markdown and raw HTML support 2022-01-24 10:09:04 +00:00
Cleanup document, remove unnecessary join 2022-01-24 10:25:29 +00:00			`generatePage(title, doc)`
Functions 2022-01-22 14:06:25 +00:00
Cleanup document, remove unnecessary join 2022-01-24 10:25:29 +00:00			`def generatePage(title, doc):`
Only change edited pages, W.I.P 2022-01-26 10:03:25 +00:00			`global pages`
			`global titles`
			`if 'pages' not in globals():`
			`pages = []`
			`if 'titles' not in globals():`
			`titles = []`
Small code reduction 2022-01-26 10:08:19 +00:00
Better navbar styling support 2022-02-03 13:34:15 +00:00			`navbarfile = Path(__file__).parent.joinpath('navbar')`

			`if navbarfile.exists():`
			`with navbarfile.open('r') as navbarfile:`
			`navbar = generateNavigationBar(navbarfile.readlines(), title)`

Experimental footer, identical to navbar 2022-01-31 10:11:51 +00:00			`if 'footer' in globals():`
			`pages.append(str(E.ul(navbar)) + str(doc) + str(E.ul(footer)))`
			`else:`
			`pages.append(str(E.ul(navbar)) + str(doc))`
Only change edited pages, W.I.P 2022-01-26 10:03:25 +00:00			`else:`
Better navbar styling support 2022-02-03 13:34:15 +00:00			`print("No 'navbar' file found, there will be no navigation bar.")`

Experimental footer, identical to navbar 2022-01-31 10:11:51 +00:00			`if 'footer' in globals():`
			`pages.append(str(doc) + str(E.ul(footer)))`
			`else:`
			`pages.append(str(doc))`
Better navbar styling support 2022-02-03 13:34:15 +00:00
More code cleanup 2022-01-26 10:36:59 +00:00			`titles.append(title)`
Only change edited pages, W.I.P 2022-01-26 10:03:25 +00:00
Better navbar styling support 2022-02-03 13:34:15 +00:00			`def writePages():`
Only change edited pages, W.I.P 2022-01-26 10:03:25 +00:00			`global pages`
			`global titles`
			`#TODO only delete files that aren't present in newest site generation`
			`#deleting contents of folder without deleting the folder, to increase compatibility with various systems`
			`#for root, dirs, files in os.walk('./website-output'):`
			`# for f in files:`
			`# os.unlink(os.path.join(root, f))`
			`# for d in dirs:`
			`# rmtree(os.path.join(root, d))`

			`for id, page in enumerate(pages):`
			`foldername = ""`
More code cleanup 2022-01-26 10:36:59 +00:00
Only change edited pages, W.I.P 2022-01-26 10:03:25 +00:00			`#creates ./website-output/pagetitle/index.html file if it is not homepage`
			`if titles[id] != homepage:`
More flexible resources implementation 2022-02-01 16:36:30 +00:00			`foldername = titles[id].replace(" ", "-").lower()`

			`outputpath = Path(__file__).parent.joinpath("website-output")`

			`dirpath = outputpath.joinpath(foldername)`
Only change edited pages, W.I.P 2022-01-26 10:03:25 +00:00
Use pathlib more wisely 2022-01-27 11:02:35 +00:00			`dirpath.mkdir(parents=True, exist_ok=True)`
Only change edited pages, W.I.P 2022-01-26 10:03:25 +00:00
Use pathlib more wisely 2022-01-27 11:02:35 +00:00			`filepath = dirpath.joinpath("index.html")`
More pathlib usage & code cleanup 2022-01-27 10:11:33 +00:00
Completely migrate to pathlib 2022-01-27 10:29:24 +00:00			`if filepath.exists():`
			`with filepath.open('r') as newpage:`
Small code reduction 2022-01-26 10:08:19 +00:00			`if newpage.read() == page:`
More code cleanup 2022-01-26 10:36:59 +00:00			`print("Page not changed: " + titles[id])`
			`continue`
More pathlib usage & code cleanup 2022-01-27 10:11:33 +00:00
Completely migrate to pathlib 2022-01-27 10:29:24 +00:00			`with filepath.open('w') as newpage:`
More code cleanup 2022-01-26 10:36:59 +00:00			`newpage.write(page)`
			`print("Written changed page: " + titles[id])`
Use main() 2022-01-24 16:49:02 +00:00
Add basic resources support 2022-01-31 10:56:41 +00:00			`#resources`
			`respath = Path(__file__).parent.joinpath("resources")`
			`if respath.exists():`
More flexible resources implementation 2022-02-01 16:36:30 +00:00
			`#shutil.copytree copies timestamp too`
			`shutil.copytree(respath, outputpath, dirs_exist_ok=True)`

			`#check if folders are named correctly`
			`for folder in outputpath.iterdir():`
			`if folder.is_dir():`

			`#rename folder name format from "About Page" to "about-page"`
			`bettername = folder.name.replace(" ", "-").lower()`

			`if folder.name != bettername:`
			`newpath = outputpath.joinpath(bettername)`

			`#example: resources folder is "About", page got auto-created earlier as "about" (from About.page), let's copy "About" resources to "about" and delete "About"`
			`if newpath.exists():`
			`shutil.copytree(folder, newpath, dirs_exist_ok=True)`
			`shutil.rmtree(folder)`
			`else:`
			`shutil.move(str(folder), newpath)`

Use main() 2022-01-24 16:49:02 +00:00			`def main():`
More code cleanup 2022-01-26 10:36:59 +00:00
Use main() 2022-01-24 16:49:02 +00:00			`#if homepage is at Home.page, set homepage to "Home"`
Better navbar styling support 2022-02-03 13:34:15 +00:00			`global homepage`
Use main() 2022-01-24 16:49:02 +00:00			`homepage = "Home"`

Experimental footer, identical to navbar 2022-01-31 10:11:51 +00:00			`footerfile = Path(__file__).parent.joinpath('footer')`

			`if footerfile.exists():`
			`with footerfile.open('r') as footerfile:`
			`generateFooter(footerfile.readlines())`
			`else:`
			`print("No 'footer' file found, there will be no footer.")`

Use main() 2022-01-24 16:49:02 +00:00			`pagescount = 0`
Completely migrate to pathlib 2022-01-27 10:29:24 +00:00
			`for file in Path(__file__).parent.iterdir():`
			`if file.is_file():`
Use pathlib more wisely 2022-01-27 11:02:35 +00:00			`if file.suffix == ".page":`
Completely migrate to pathlib 2022-01-27 10:29:24 +00:00			`pagescount += 1`
			`with file.open('r') as page:`
Remove unused comment 2022-01-27 11:03:53 +00:00			`generateLines(file.stem, page.readlines())`
Only change edited pages, W.I.P 2022-01-26 10:03:25 +00:00			`print("Found " + str(pagescount) + " pages")`

More code cleanup 2022-01-26 10:36:59 +00:00			`#write all pages to files`
Better navbar styling support 2022-02-03 13:34:15 +00:00			`writePages()`
Use main() 2022-01-24 16:49:02 +00:00
			`if __name__ == "__main__":`
Only change edited pages, W.I.P 2022-01-26 10:03:25 +00:00			`main()`