mirror of https://gitlab.com/octtspacc/staticoso
414 lines
14 KiB
Python
414 lines
14 KiB
Python
""" ================================= |
|
|
| This file is part of |
|
|
| staticoso |
|
|
| Just a simple Static Site Generator |
|
|
| |
|
|
| Licensed under the AGPLv3 license |
|
|
| Copyright (C) 2022, OctoSpacc |
|
|
| ================================= """
|
|
|
|
from Libs import htmlmin
|
|
from Libs.bs4 import BeautifulSoup
|
|
from Modules.HTML import *
|
|
from Modules.Markdown import *
|
|
from Modules.Pug import *
|
|
from Modules.Utils import *
|
|
|
|
def DashifyTitle(Title, Done=None):
    """Return the dashified form of Title, de-duplicated against Done.

    Title is passed through DashifyStr and the result is handed to
    UndupeStr together with Done and '-' (presumably the separator used
    for a disambiguating suffix; see UndupeStr to confirm).

    Done: identifiers already in use. When omitted, a fresh empty list is
    used for this call.
    """
    # A literal [] default would be one list object shared by every call.
    if Done is None:
        Done = []
    return UndupeStr(DashifyStr(Title), Done, '-')
|
|
|
|
def MakeLinkableTitle(Line, Title, DashTitle, Type):
    """Return a heading line that carries DashTitle as its id.

    Type 'md':  Title is a '#'-prefixed heading such as '## Text'. Returns
                '<hN id="DashTitle">Text</hN>', N being the number of
                leading '#' characters.
    Type 'pug': Line is a Pug heading line. "(id='DashTitle')" is inserted
                right after the two characters starting at the first 'h'.
    Any other Type returns None.
    """
    if Type == 'md':
        # Count only the leading run of '#', so a '#' later in the first
        # word (e.g. '#C# notes') does not inflate the heading level.
        Level = len(Title) - len(Title.lstrip('#'))
        Text = Title[Level:]
        # Drop the single separator after the marker only if one is there;
        # '#Title' must not lose its first letter.
        if Text[:1].isspace():
            Text = Text[1:]
        return '<h{} id="{}">{}</h{}>'.format(Level, DashTitle, Text, Level)
    elif Type == 'pug':
        Index = Line.find('h')
        # Leading part, the 'hN' tag name, the id attribute, then the rest.
        return "{}{}(id='{}'){}".format(
            Line[:Index], Line[Index:Index+2], DashTitle, Line[Index+2:])
|
|
|
|
def GetTitle(Meta, Titles, Prefer='MetaTitle', BlogName=None):
    """Pick the title of a page from its metadata and body headings.

    Prefer selects the lookup order:
      'BodyTitle': first body heading, Meta['Title'], 'Untitled'
      'MetaTitle': Meta['Title'], first body heading, 'Untitled'
      'HTMLTitle': Meta['HTMLTitle'], Meta['Title'], first body heading,
                   'Untitled'
    A body heading has its leading '#' characters stripped (the space that
    follows them is kept). For pages whose Meta['Type'] is 'Post',
    ' - ' + BlogName is appended when BlogName is truthy.
    """
    if Prefer == 'BodyTitle':
        if Titles:
            Title = Titles[0].lstrip('#')
        else:
            Title = Meta['Title'] or 'Untitled'
    elif Prefer == 'MetaTitle':
        if Meta['Title']:
            Title = Meta['Title']
        elif Titles:
            Title = Titles[0].lstrip('#')
        else:
            Title = 'Untitled'
    elif Prefer == 'HTMLTitle':
        if Meta['HTMLTitle']:
            Title = Meta['HTMLTitle']
        elif Meta['Title']:
            Title = Meta['Title']
        elif Titles:
            Title = Titles[0].lstrip('#')
        else:
            Title = 'Untitled'
    # Posts get the blog name as a suffix.
    if Meta['Type'] == 'Post' and BlogName:
        Title = Title + ' - ' + BlogName
    return Title
|
|
|
|
def GetDescription(Meta, BodyDescription, Prefer='MetaDescription'):
    """Pick the page description.

    With Prefer='BodyDescription' the text taken from the body wins and
    Meta['Description'] is the fallback; with Prefer='MetaDescription' it
    is the other way round. '' is returned when both are empty.
    """
    if Prefer == 'BodyDescription':
        if BodyDescription:
            Description = BodyDescription
        else:
            Description = Meta['Description'] or ''
    elif Prefer == 'MetaDescription':
        if Meta['Description']:
            Description = Meta['Description']
        else:
            Description = BodyDescription or ''
    return Description
|
|
|
|
def GetImage(Meta, BodyImage, Prefer='MetaImage'):
    """Pick the page image.

    With Prefer='BodyImage' the image found in the body wins and
    Meta['Image'] is the fallback; with Prefer='MetaImage' it is the other
    way round. '' is returned when both are empty.
    """
    if Prefer == 'BodyImage':
        if BodyImage:
            Image = BodyImage
        else:
            Image = Meta['Image'] or ''
    elif Prefer == 'MetaImage':
        if Meta['Image']:
            Image = Meta['Image']
        else:
            Image = BodyImage or ''
    return Image
|
|
|
|
def MakeContentHeader(Meta, Locale, Categories=''):
    """Render the header shown with a page's content.

    One row is produced for each of Meta['CreatedOn'] and Meta['EditedOn']
    that is set, labelled with the matching Locale entry, plus a
    Locale['Categories'] row when Categories is non-empty. The rows are
    concatenated and passed through markdown().
    """
    # NOTE(review): each row ends in ' \n'; a Markdown hard line break
    # usually needs two trailing spaces, so confirm this is intended.
    Rows = [
        '{} {} \n'.format(Locale[Key], Meta[Key])
        for Key in ('CreatedOn', 'EditedOn')
        if Meta[Key]]
    if Categories:
        Rows.append('{}: {} \n'.format(Locale['Categories'], Categories))
    return markdown(''.join(Rows))
|
|
|
|
def MakeCategoryLine(File, Meta):
    """Return Markdown links to the category pages of Meta['Categories'].

    Each category becomes '[Name](<levels>Categories/Name.html) ', where
    <levels> is GetPathLevels(File). Returns '' when the page has no
    categories.
    """
    if not Meta['Categories']:
        return ''
    return ''.join(
        '[{}]({}{}.html) '.format(Cat, GetPathLevels(File) + 'Categories/', Cat)
        for Cat in Meta['Categories'])
|
|
|
|
def GetHTMLPagesList(Pages, BlogName, SiteRoot, PathPrefix, Unite=None, Type='Page', Category=None, For='Menu', MarkdownExts=()):
    """Build a nested list of pages (menu or category list) and render it.

    Pages:        entries of the form [File, Content, Titles, Meta].
    PathPrefix:   forwarded to MakeListTitle as the link prefix.
    Unite:        extra entries; every truthy item is inserted at its own
                  index and listed with its raw text as the title.
    Type:         only pages whose Meta['Type'] equals this are listed.
    Category:     when set, only pages having it in Meta['Categories'].
    For:          checked against Meta['Index'] through CanIndex.
    MarkdownExts: forwarded to MarkdownHTMLEscape and markdown.

    Returns what markdown() produces for the '- '-prefixed list text.
    """
    List, LastParent = '', []
    if Unite is None:
        Unite = []
    # Filter in one pass into a new list. Removing entries from a list
    # while iterating over it skips the entry after each removed one.
    IndexPages = [
        e for e in Pages
        if e[3]['Index'] not in ('False', 'None') and e[3]['Type'] == Type]
    if Type == 'Page':
        IndexPages = OrderPages(IndexPages)
    for i,e in enumerate(Unite):
        if e:
            IndexPages.insert(i,[e,None,None,{'Type':Type,'Index':'True','Order':'Unite'}])
    for File, Content, Titles, Meta in IndexPages:
        if Meta['Type'] == Type and CanIndex(Meta['Index'], For) and (not Category or Category in Meta['Categories']):
            # United entries are always top-level; others nest by folder.
            Depth = (File.count('/') + 1) if Meta['Order'] != 'Unite' else 1
            if Depth > 1 and Meta['Order'] != 'Unite':
                CurParent = File.split('/')[:-1]
                for i,s in enumerate(CurParent):
                    # LastParent is set to CurParent on the first pass, so
                    # a folder row is emitted at most once per new folder.
                    if LastParent != CurParent:
                        LastParent = CurParent
                        Levels = '- ' * (Depth-1+i)
                        if StripExt(File).endswith('index'):
                            # The folder's index page is the folder row.
                            Title = MakeListTitle(File, Meta, Titles, 'HTMLTitle', SiteRoot, BlogName, PathPrefix)
                        else:
                            Title = CurParent[Depth-2+i]
                        List += Levels + Title + '\n'
            # Nested index pages were already emitted as the folder row.
            if not (Depth > 1 and StripExt(File).endswith('index')):
                Levels = '- ' * Depth
                if Meta['Order'] == 'Unite':
                    Title = File
                else:
                    Title = MakeListTitle(File, Meta, Titles, 'HTMLTitle', SiteRoot, BlogName, PathPrefix)
                List += Levels + Title + '\n'
    return markdown(MarkdownHTMLEscape(List, MarkdownExts), extensions=MarkdownExts)
|
|
|
|
def Preprocessor(Path, SiteRoot):
    """Read a source page and split it into content, headings and metadata.

    Lines whose stripped form starts with '// ' are metadata directives
    ('Key: value') and are not copied into the content. Every other line
    is copied; headings are also recorded and given an id.

    Path:     source file path; only names ending in '.md' or '.pug'
              contribute any content.
    SiteRoot: not used in this function's body.

    Returns (Content, Titles, Meta).
    """
    File = ReadFile(Path)
    # Meta starts with these defaults; directives in the file override them.
    Content, Titles, DashyTitles, Meta = '', [], [], {
        'Template': 'Standard.html',
        'Style': '',
        'Type': '',
        'Index': 'True',
        'Title': '',
        'HTMLTitle': '',
        'Description': '',
        'Image': '',
        'Categories': [],
        'CreatedOn': '',
        'EditedOn': '',
        'Order': None}
    for l in File.splitlines():
        ls = l.lstrip()
        if ls.startswith('// '):
            lss = ls[3:]
            # Plain string-valued keys: store the text after 'Key: ' as is.
            for Item in ('Template', 'Type', 'Index', 'Title', 'HTMLTitle', 'Description', 'Image', 'CreatedOn', 'EditedOn'):
                ItemText = '{}: '.format(Item)
                if lss.startswith(ItemText):
                    Meta[Item] = lss[len(ItemText):]
            if lss.startswith('Categories: '):
                # Categories are separated by single spaces and accumulate.
                for i in lss[len('Categories: '):].split(' '):
                    Meta['Categories'] += [i]
            elif lss.startswith('Background: '):
                # Shorthand that appends a #MainBox background rule to Style.
                Meta['Style'] += "#MainBox{Background:" + lss[len('Background: '):] + ";} "
            elif lss.startswith('Style: '):
                Meta['Style'] += lss[len('Style: '):] + ' '
            elif lss.startswith('Order: '):
                # int() raises ValueError when the value is not an integer.
                Meta['Order'] = int(lss[len('Order: '):])
        else:
            if Path.endswith('.md'):
                if ls.startswith('#'):
                    # NOTE(review): the unstripped line `l` (not `ls`) is
                    # dashified and stored, so an indented heading keeps
                    # its leading whitespace and '#' here - confirm intended.
                    DashTitle = DashifyTitle(l.lstrip('#'), DashyTitles)
                    DashyTitles += [DashTitle]
                    Titles += [l]
                    Content += MakeLinkableTitle(l, ls, DashTitle, 'md') + '\n'
                else:
                    Content += l + '\n'
            elif Path.endswith('.pug'):
                if ls.startswith(('h1', 'h2', 'h3', 'h4', 'h5', 'h6')):
                    # Headings with a leading NoTitle class are copied
                    # through without being recorded as titles.
                    if ls[2:].startswith(("(class='NoTitle", '(class="NoTitle')):
                        Content += l + '\n'
                    else:
                        # Store the heading in '#' form: one '#' per level,
                        # then the text after 'hN' and one more character.
                        Title = '#'*int(ls[1]) + str(ls[3:])
                        DashTitle = DashifyTitle(Title.lstrip('#'), DashyTitles)
                        DashyTitles += [DashTitle]
                        Titles += [Title]
                        # TODO: We should handle headers that for any reason already have parenthesis
                        # NOTE(review): this is true only when the stripped
                        # line is exactly 'hN(' - confirm that is the intent.
                        if ls[2:] == '(':
                            Content += l + '\n'
                        else:
                            Content += MakeLinkableTitle(l, Title, DashTitle, 'pug') + '\n'
                else:
                    Content += l + '\n'
    return Content, Titles, Meta
|
|
|
|
def MakeListTitle(File, Meta, Titles, Prefer, SiteRoot, BlogName, PathPrefix=''):
    """Return the Markdown text for one page entry in a page list.

    The title comes from GetTitle. Unless Meta['Index'] is 'Unlinked' it
    is wrapped in a link to PathPrefix + StripExt(File) + '.html'. For
    pages of type 'Post' the entry is prefixed with '[CreatedOn] ', using
    '?' when Meta['CreatedOn'] is empty. SiteRoot is not used here.
    """
    Title = GetTitle(Meta, Titles, Prefer, BlogName)
    if Meta['Index'] != 'Unlinked':
        Target = '{}{}.html'.format(PathPrefix, StripExt(File))
        Title = '[{}]({})'.format(Title, Target)
    if Meta['Type'] == 'Post':
        Title = '[{}] {}'.format(Meta['CreatedOn'] or '?', Title)
    return Title
|
|
|
|
def FormatTitles(Titles):
    """Render the headings of a page as a nested list of anchor links.

    Each heading becomes one row, prefixed with one '- ' per '#' in its
    first space-delimited token, linking to '#<id>'. The id is obtained
    from DashifyTitle with the ids already produced in this call. The rows
    are passed through markdown().
    """
    # TODO: Somehow titles written in Pug can end up here and don't work, they should be handled
    Rows, UsedIds = [], []
    for Heading in Titles:
        Level = Heading.split(' ')[0].count('#')
        Text = Heading.lstrip('#')
        Anchor = DashifyTitle(Text, UsedIds)
        UsedIds.append(Anchor)
        Rows.append('- ' * Level + '[{}](#{})'.format(Text, Anchor) + '\n')
    return markdown(''.join(Rows))
|
|
|
|
def OrderPages(Old):
    """Return the pages of Old sorted by their Meta['Order'].

    Old: entries whose fourth item is the page's Meta dict.

    Pages with a truthy Order come first, in ascending Order. Pages that
    share an Order are all kept, in their input order. Pages whose Order
    is falsy (None or 0) follow, also in input order. Old itself is not
    modified.
    """
    Ordered, NoOrder = [], []
    for Page in Old:
        if Page[3]['Order']:
            Ordered.append(Page)
        else:
            NoOrder.append(Page)
    # list.sort is stable, so equal Orders keep their relative position.
    # Writing each page into a slot indexed by Order would keep only one
    # page per Order value.
    Ordered.sort(key=lambda Page: Page[3]['Order'])
    return Ordered + NoOrder
|
|
|
|
def CanIndex(Index, For):
    """Tell whether a page with the given Index setting is listed in For.

    'False' and 'None' are never listed; 'True', 'All' and 'Unlinked' are
    always listed; any other value is listed only in the list it names.
    """
    if Index in ('False', 'None'):
        return False
    if Index in ('True', 'All', 'Unlinked'):
        return True
    return Index == For
|
|
|
|
def PatchHTML(File, HTML, PartsText, ContextParts, ContextPartsText, HTMLPagesList, PagePath, Content, Titles, Meta, SiteRoot, SiteName, BlogName, FolderRoots, Categories, SiteLang, Locale):
    """Fill the '[HTML:...]' placeholders of a template for one page.

    HTML:             template text.
    PartsText:        name -> text for '[HTML:Part:<name>]'.
    ContextParts:     section -> part name or list of part names.
    ContextPartsText: '<path>/<part>' -> text for '[HTML:ContextPart:<path>]'.
    Content:          page content, already HTML.
    FolderRoots:      name -> value for '[HTML:Folder:<name>:AbsoluteRoot]'.
    Categories:       name -> HTML for '<span>[HTML:Category:<name>]</span>'.

    Returns (HTML, ContentHTML, SlimHTML, Description, Image): the filled
    template, Content with its site/folder/category placeholders expanded,
    HTMLPagesList + ContentHTML, and the chosen description and image.
    """
    HTMLTitles = FormatTitles(Titles)
    BodyDescription, BodyImage = '', ''
    Parse = BeautifulSoup(Content, 'html.parser')
    if not BodyDescription and Parse.p:
        # First paragraph: at most 150 characters, on one line, with double
        # quotes replaced by single ones; '...' is always appended.
        BodyDescription = Parse.p.get_text()[:150].replace('\n', ' ').replace('"', "'") + '...'
    # .get() rather than ['src']: an <img> without a src attribute must not
    # raise KeyError, it just provides no body image.
    if not BodyImage and Parse.img and Parse.img.get('src'):
        BodyImage = Parse.img['src']

    Title = GetTitle(Meta, Titles, 'MetaTitle', BlogName)
    Description = GetDescription(Meta, BodyDescription, 'MetaDescription')
    Image = GetImage(Meta, BodyImage, 'MetaImage')

    # Context parts: a line consisting only of '[HTML:ContextPart:<path>]'
    # is replaced by the part(s) configured for the last path segment.
    for Line in HTML.splitlines():
        Line = Line.lstrip().rstrip()
        if Line.startswith('[HTML:ContextPart:') and Line.endswith(']'):
            Path = Line[len('[HTML:ContextPart:'):-1]
            Section = Path.split('/')[-1]
            if Section in ContextParts:
                Part = ContextParts[Section]
                Text = ''
                if isinstance(Part, list):
                    for i in Part:
                        Text += ContextPartsText['{}/{}'.format(Path, i)] + '\n'
                elif isinstance(Part, str):
                    Text = ContextPartsText['{}/{}'.format(Path, Part)]
            else:
                # Unknown section: the placeholder is removed.
                Text = ''
            HTML = HTML.replace('[HTML:ContextPart:{}]'.format(Path), Text)
    for i in PartsText:
        HTML = HTML.replace('[HTML:Part:{}]'.format(i), PartsText[i])
    # The replacements run in this order, so text inserted by an earlier
    # one is still subject to the later ones.
    HTML = ReplWithEsc(HTML, '[HTML:Site:Menu]', HTMLPagesList)
    HTML = ReplWithEsc(HTML, '[HTML:Page:Lang]', SiteLang)
    HTML = ReplWithEsc(HTML, '[HTML:Page:Chapters]', HTMLTitles)
    HTML = ReplWithEsc(HTML, '[HTML:Page:Title]', Title)
    HTML = ReplWithEsc(HTML, '[HTML:Page:Description]', Description)
    HTML = ReplWithEsc(HTML, '[HTML:Page:Image]', Image)
    HTML = ReplWithEsc(HTML, '[HTML:Page:Path]', PagePath)
    HTML = ReplWithEsc(HTML, '[HTML:Page:Style]', Meta['Style'])
    HTML = ReplWithEsc(HTML, '[HTML:Page:Content]', Content)
    HTML = ReplWithEsc(HTML, '[HTML:Page:ContentHeader]', MakeContentHeader(Meta, Locale, MakeCategoryLine(File, Meta)))
    HTML = ReplWithEsc(HTML, '[HTML:Site:Name]', SiteName)
    HTML = ReplWithEsc(HTML, '[HTML:Site:AbsoluteRoot]', SiteRoot)
    HTML = ReplWithEsc(HTML, '[HTML:Site:RelativeRoot]', GetPathLevels(PagePath))
    for i in FolderRoots:
        HTML = HTML.replace('[HTML:Folder:{}:AbsoluteRoot]'.format(i), FolderRoots[i])
    for i in Categories:
        HTML = HTML.replace('<span>[HTML:Category:{}]</span>'.format(i), Categories[i])

    # TODO: Clean this doubling?
    # The same site/folder/category expansion on the bare content, which
    # is returned separately from the full page.
    ContentHTML = Content
    ContentHTML = ContentHTML.replace('[HTML:Site:AbsoluteRoot]', SiteRoot)
    ContentHTML = ContentHTML.replace('[HTML:Site:RelativeRoot]', GetPathLevels(PagePath))
    for i in FolderRoots:
        ContentHTML = ContentHTML.replace('[HTML:Folder:{}:AbsoluteRoot]'.format(i), FolderRoots[i])
    for i in Categories:
        ContentHTML = ContentHTML.replace('<span>[HTML:Category:{}]</span>'.format(i), Categories[i])
    SlimHTML = HTMLPagesList + ContentHTML

    return HTML, ContentHTML, SlimHTML, Description, Image
|
|
|
|
def DoMinifyHTML(HTML):
    """Return HTML minified by htmlmin with this module's fixed options."""
    Options = {
        'remove_comments': True,
        'remove_empty_space': True,
        'remove_all_empty_space': False,
        'reduce_empty_attributes': True,
        'reduce_boolean_attributes': True,
        'remove_optional_attribute_quotes': True,
        'convert_charrefs': True,
        'keep_pre': True,
    }
    return htmlmin.minify(input=HTML, **Options)
|
|
|
|
def MakeSite(TemplatesText, PartsText, ContextParts, ContextPartsText, ConfMenu, SiteName, BlogName, SiteTagline, SiteDomain, SiteRoot, FolderRoots, SiteLang, Locale, Minify, NoScripts, Sorting, MarkdownExts, AutoCategories):
    """Preprocess every source page and post and write the site's HTML.

    TemplatesText:  template name -> template text, looked up with
                    Meta['Template'].
    ConfMenu:       extra menu entries; entries equal to a generated
                    page's '.html' path are set to None in place.
    Sorting:        {'Pages': ..., 'Posts': ...}; 'Standard' sorts the
                    paths ascending, 'Inverse' uses RevSort, anything else
                    leaves them as found.
    Minify:         run the final HTML through DoMinifyHTML.
    NoScripts:      strip 'script' tags with StripTags before writing.
    AutoCategories: create a stub page for every category without one.
    SiteTagline and SiteDomain are not used in this function's body.
    The remaining arguments are forwarded to GetHTMLPagesList / PatchHTML.

    Returns MadePages: one [File, Content, Titles, Meta, ContentHTML,
    SlimHTML, Description, Image] entry per written page.
    """
    PagesPaths, PostsPaths, Pages, MadePages, Categories = [], [], [], [], {}
    # Collect the source files under Pages/ and Posts/ for each extension.
    for Ext in FileExtensions['Pages']:
        for File in Path('Pages').rglob('*.{}'.format(Ext)):
            PagesPaths += [FileToStr(File, 'Pages/')]
        for File in Path('Posts').rglob('*.{}'.format(Ext)):
            PostsPaths += [FileToStr(File, 'Posts/')]

    if Sorting['Pages'] == 'Standard':
        PagesPaths.sort()
    elif Sorting['Pages'] == 'Inverse':
        PagesPaths = RevSort(PagesPaths)
    if Sorting['Posts'] == 'Standard':
        PostsPaths.sort()
    elif Sorting['Posts'] == 'Inverse':
        PostsPaths = RevSort(PostsPaths)

    print("[I] Preprocessing Source Pages")
    for Type in ['Page', 'Post']:
        if Type == 'Page':
            Files = PagesPaths
        elif Type == 'Post':
            Files = PostsPaths
        for File in Files:
            Content, Titles, Meta = Preprocessor('{}s/{}'.format(Type, File), SiteRoot)
            # Posts keep their 'Posts/' folder in File; pages do not.
            if Type != 'Page':
                File = Type + 's/' + File
            # Files that do not declare a Type get the one of their folder.
            if not Meta['Type']:
                Meta['Type'] = Type
            Pages += [[File, Content, Titles, Meta]]
            # Register every category seen; its list HTML is filled below.
            for Cat in Meta['Categories']:
                Categories.update({Cat:''})
    # NOTE(review): presumably compiles the Pug pages into public/, since
    # the '.pug' branch below reads its content from PagePath - confirm.
    PugCompileList(Pages)

    if Categories:
        print("[I] Generating Category Lists")
        for Cat in Categories:
            # A category's list is its page list followed by its post list.
            for Type in ('Page', 'Post'):
                Categories[Cat] += GetHTMLPagesList(
                    Pages=Pages,
                    BlogName=BlogName,
                    SiteRoot=SiteRoot,
                    PathPrefix=GetPathLevels('Categories/'),
                    Type=Type,
                    Category=Cat,
                    For='Categories',
                    MarkdownExts=MarkdownExts)

    if AutoCategories:
        Dir = 'public/Categories'
        for Cat in Categories:
            # Look for any existing file named '<Cat>.*' under Dir.
            Exists = False
            for File in Path(Dir).rglob(str(Cat)+'.*'):
                Exists = True
                break
            if not Exists:
                # Write a stub source page and add it to the build.
                File = 'Categories/{}.md'.format(Cat)
                FilePath = 'public/{}'.format(File)
                WriteFile(FilePath, """\
// Title: {Category}
// Type: Page

# {Category}

<div><span>[HTML:Category:{Category}]</span></div>
""".format(Category=Cat))
                Content, Titles, Meta = Preprocessor(FilePath, SiteRoot)
                Pages += [[File, Content, Titles, Meta]]

    # Blank the menu entries that name a generated page, so they are not
    # also inserted as united entries.
    for i,e in enumerate(ConfMenu):
        for File, Content, Titles, Meta in Pages:
            File = StripExt(File)+'.html'
            if e == File:
                ConfMenu[i] = None

    print("[I] Writing Pages")
    for File, Content, Titles, Meta in Pages:
        # The menu is rebuilt per page because its links depend on
        # GetPathLevels(File).
        HTMLPagesList = GetHTMLPagesList(
            Pages=Pages,
            BlogName=BlogName,
            SiteRoot=SiteRoot,
            PathPrefix=GetPathLevels(File),
            Unite=ConfMenu,
            Type='Page',
            For='Menu',
            MarkdownExts=MarkdownExts)
        PagePath = 'public/{}.html'.format(StripExt(File))
        if File.endswith('.md'):
            Content = markdown(Content, extensions=MarkdownExts)
        elif File.endswith('.pug'):
            # Content is read back from the output path.
            Content = ReadFile(PagePath)
        HTML, ContentHTML, SlimHTML, Description, Image = PatchHTML(
            File=File,
            HTML=TemplatesText[Meta['Template']],
            PartsText=PartsText,
            ContextParts=ContextParts,
            ContextPartsText=ContextPartsText,
            HTMLPagesList=HTMLPagesList,
            PagePath=PagePath[len('public/'):],
            Content=Content,
            Titles=Titles,
            Meta=Meta,
            SiteRoot=SiteRoot,
            SiteName=SiteName,
            BlogName=BlogName,
            FolderRoots=FolderRoots,
            Categories=Categories,
            SiteLang=SiteLang,
            Locale=Locale)
        if NoScripts:
            HTML = StripTags(HTML, ['script'])
        if Minify:
            HTML = DoMinifyHTML(HTML)
        WriteFile(PagePath, HTML)
        MadePages += [[File, Content, Titles, Meta, ContentHTML, SlimHTML, Description, Image]]

    return MadePages
|