staticoso/Source/Build.py

377 lines
15 KiB
Python
Raw Normal View History

2022-05-16 20:12:06 +02:00
#!/usr/bin/env python3
""" ================================= |
| This file is part of |
| staticoso |
| Just a simple Static Site Generator |
2022-05-21 20:03:27 +02:00
| |
| Licensed under the AGPLv3 license |
| Copyright (C) 2022, OctoSpacc |
| ================================= """
2022-05-17 18:16:39 +02:00
2022-05-24 00:22:32 +02:00
import argparse
2022-05-16 20:12:06 +02:00
import os
import shutil
2022-08-28 00:32:45 +02:00
import time
2022-06-07 13:42:32 +02:00
from ast import literal_eval
2022-06-24 20:00:38 +02:00
from datetime import datetime
from pathlib import Path
2022-07-11 17:28:59 +02:00
from Modules.Config import *
2022-06-29 00:17:52 +02:00
from Modules.Gemini import *
from Modules.Globals import *
from Modules.Logging import *
2022-07-14 20:38:45 +02:00
from Modules.Markdown import *
from Modules.Site import *
2022-07-13 17:40:09 +02:00
from Modules.Sitemap import *
from Modules.Utils import *
2022-10-17 09:19:07 +02:00
# ActivityPub support is optional: when the module (or one of its own
# dependencies) cannot be imported, the feature is switched off instead of
# aborting the build.
try:
    from Modules.ActivityPub import *
    ActivityPub = True
except Exception:
    # `Exception` rather than a bare `except:` so that KeyboardInterrupt and
    # SystemExit are not swallowed while the module is loading.
    logging.warning("⚠ Can't load the ActivityPub module. Its use is disabled. Make sure the 'requests' library is installed.")
    ActivityPub = False
2022-11-05 12:17:23 +01:00
# CSS minifier used by Main() when asset minification is enabled.
# NOTE(review): `python_only=True` presumably selects rcssmin's pure-Python
# implementation instead of its optional C extension — confirm against the
# bundled Libs/rcssmin.
from Libs import rcssmin
cssmin = rcssmin._make_cssmin(python_only=True)
2022-10-17 09:19:07 +02:00
2022-08-30 16:31:33 +02:00
def ResetOutDir(OutDir):
    """Delete the HTML output tree and its sibling "<OutDir>.gmi" tree.

    A tree that does not exist is silently skipped; any other error raised
    by `shutil.rmtree` propagates to the caller.
    """
    Targets = (OutDir, f"{OutDir}.gmi")
    for Target in Targets:
        try:
            shutil.rmtree(Target)
        except FileNotFoundError:
            # Nothing to delete for this target: move on to the next one.
            continue
2022-05-16 20:12:06 +02:00
2022-08-27 16:50:50 +02:00
def DelTmp(OutDir):
    """Remove temporary files left in the output trees.

    Two passes are made:
    1. every file under `OutDir` whose extension is listed in
       `FileExtensions['Tmp']`;
    2. every `*.tmp` file under both `OutDir` and "<OutDir>.gmi".
    """
    # Pass 1: configured temporary extensions, HTML output tree only.
    for Suffix in FileExtensions['Tmp']:
        Pattern = f"*.{Suffix}"
        for Leftover in Path(OutDir).rglob(Pattern):
            os.remove(Leftover)
    # Pass 2: plain .tmp files in both output trees.
    for Tree in (OutDir, f"{OutDir}.gmi"):
        for Leftover in Path(Tree).rglob('*.tmp'):
            os.remove(Leftover)
2022-06-23 17:20:06 +02:00
def SetSorting(Sorting):
    """Fill in the default sort order for any section missing from `Sorting`.

    `Sorting` is modified in place and also returned. Keys already present
    keep their value; 'Pages' defaults to 'Standard' and 'Posts' to 'Inverse'.
    """
    for Section, Order in (('Pages', 'Standard'), ('Posts', 'Inverse')):
        Sorting.setdefault(Section, Order)
    return Sorting
2022-07-15 16:48:18 +02:00
def GetConfMenu(Entries, MarkdownExts):
    """Turn the numbered menu entries of the site configuration into a list.

    Args:
        Entries: mapping whose keys are integer-like strings (the menu
            position) and whose values are the entry text. May be empty
            or None.
        MarkdownExts: unused here; kept so existing callers keep working.

    Returns:
        A list indexed by menu position. Positions without an entry hold
        None. An empty list is returned when there are no entries, the same
        value the caller in Main() falls back to.
    """
    if not Entries:
        # Previously `Menu` was only bound inside the `if Entries:` branch,
        # so an empty mapping did not produce a usable (empty) menu.
        return []
    # The list must be long enough to hold the highest declared position.
    Max = max(0, max(int(i) for i in Entries))
    Menu = [None] * (Max+1)
    for i in Entries:
        e = Entries[i]
        # Entries that look like raw markup (HTML tag, Markdown link or
        # list item) are kept verbatim; anything else is treated as a page
        # path and gets an '.html' suffix unless it already has an HTML one.
        IsRaw = e.startswith(('<', '[', '- ')) and e.endswith(('>', ')', '}'))
        if not IsRaw and not e.lower().endswith(FileExtensions['HTML']):
            e += '.html'
        Menu[int(i)] = e
    return Menu
2022-08-30 16:31:33 +02:00
def CheckSafeOutDir(OutDir):
    """Abort the build when `OutDir` would clobber the site sources.

    The input directory is the current working directory. The process exits
    with status 1 when the output directory is the input directory itself,
    or when it is a direct child of the input directory whose name is listed
    in `ReservedPaths`.

    Raises:
        SystemExit: with code 1, in either of the two unsafe cases.
    """
    InDir = os.path.realpath(os.getcwd())
    OutDir = os.path.realpath(OutDir)
    # os.path helpers instead of hard-coded '/' so that the comparison also
    # works with non-POSIX separators and when InDir is the filesystem root.
    OutFolder = os.path.basename(OutDir)
    if InDir == OutDir:
        logging.error(f"⛔ Output and Input directories ({OutDir}) can't be the same. Exiting.")
        raise SystemExit(1)
    if os.path.join(InDir, OutFolder) == OutDir and OutFolder in ReservedPaths:
        logging.error(f"⛔ Output directory {OutDir} can't be a reserved subdirectory of the Input. Exiting.")
        raise SystemExit(1)
2022-08-27 16:50:50 +02:00
def GetModifiedFiles(OutDir):
    """List the source files that are newer than their generated HTML.

    Walks the 'Pages' and 'Posts' directories (relative to the current
    working directory). Each source file is compared, by whole-second
    modification time, with "<OutDir>/<path without extension>.html"; a
    missing output file counts as infinitely old.

    Returns:
        The list of paths needing a rebuild: relative to 'Pages' for pages,
        and including the leading 'Posts/' component for posts.
    """
    Modified = []
    for Section in ('Pages', 'Posts'):
        for Root, _Dirs, Names in os.walk(Section):
            for Name in Names:
                Src = os.path.join(Root, Name)
                SrcTime = int(os.path.getmtime(Src))
                # Pages are output at the root of OutDir, so their leading
                # 'Pages' component is dropped; posts keep theirs.
                if Section == 'Posts':
                    Tmp = Src
                else:
                    Tmp = '/'.join(Src.split('/')[1:])
                Obj = f"{OutDir}/{StripExt(Tmp)}.html"
                try:
                    ObjTime = int(os.path.getmtime(Obj))
                except FileNotFoundError:
                    ObjTime = 0
                if SrcTime > ObjTime:
                    Modified.append(Tmp)
    return Modified
def WriteRedirects(Flags, Pages, FinalPaths, Locale):
    """Write a redirect page for every alternative URL declared by a page.

    For each page, every entry of its `Meta['URLs']` becomes
    "<OutDir>/<URL>". Destinations already listed in `FinalPaths` are
    skipped; the others are filled with `RedirectPageTemplate`, pointing at
    the page's real HTML file.

    Args:
        Flags: build settings; 'OutDir', 'SiteName' and 'SiteDomain' are read.
        Pages: iterable of 8-item page tuples as unpacked below.
        FinalPaths: output paths already written for real pages.
        Locale: localized strings; 'ClickHere' and 'IfNotRedirected' are read.
    """
    OutDir = Flags['OutDir']
    SiteName = Flags['SiteName']
    SiteDomain = Flags['SiteDomain']
    TitlePrefix = f"{SiteName} - " if SiteName else ''
    for File, _Content, _Titles, Meta, _ContentHTML, _SlimHTML, _Description, _Image in Pages:
        for URL in Meta['URLs']:
            DestFile = f"{OutDir}/{URL}"
            if DestFile in FinalPaths:
                # A real page already lives at this path: never overwrite it.
                continue
            DestURL = f"{GetPathLevels(URL)}{StripExt(File)}.html"
            mkdirps(os.path.dirname(DestFile))
            RedirectPage = RedirectPageTemplate.format(
                SiteDomain=SiteDomain,
                DestURL=DestURL,
                TitlePrefix=TitlePrefix,
                StrClick=Locale['ClickHere'],
                StrRedirect=Locale['IfNotRedirected'])
            WriteFile(DestFile, RedirectPage)
def Main(Args, FeedEntries):
    """Run a complete site build from the current working directory.

    Settings are resolved per option from the command line (`Args`), then
    from 'Site.ini', then from built-in defaults, and collected in `Flags`.
    The build then: prepares the output directory (clean or differential),
    copies 'Pages' and 'Posts' into it, generates HTML, feeds, optional
    Mastodon comment blocks, redirects, optional Gemtext and sitemap, and
    finally copies (and optionally minifies) 'Assets'.

    Args:
        Args: parsed `argparse` namespace built in the `__main__` section.
        FeedEntries: feed size requested by the caller: 'Default' to fall
            back on configuration, 0 to disable feeds, or a number (possibly
            as a string).

    Raises:
        SystemExit: with code 1 when the output directory is unsafe or when
            neither 'Pages' nor 'Posts' exists.
    """
    Flags, Snippets, FinalPaths = {}, {}, []
    HavePages, HavePosts = False, False
    SiteConf = LoadConfFile('Site.ini')

    #ConfigLogging(DefConfOptChoose('Logging', Args.Logging, ReadConf(SiteConf, 'staticoso', 'Logging')))

    #if Args.InputDir:
    #    os.chdir(Args.InputDir)
    #    print(f"[I] Current directory: {Args.InputDir}")

    SiteName = Flags['SiteName'] = OptChoose('', Args.SiteName, ReadConf(SiteConf, 'Site', 'Name'))
    if SiteName:
        logging.info(f"Compiling: {SiteName}")

    OutDir = Flags['OutDir'] = DefConfOptChoose('OutDir', Args.OutputDir, ReadConf(SiteConf, 'Site', 'OutputDir'))
    # Paths below are built as f"{OutDir}/...", so drop any trailing slash.
    OutDir = Flags['OutDir'] = OutDir.removesuffix('/')
    CheckSafeOutDir(OutDir)
    logging.info(f"Outputting to: {OutDir}/")

    Threads = Args.Threads if Args.Threads else DefConf['Threads']
    DiffBuild = Args.DiffBuild if Args.DiffBuild else DefConf['DiffBuild']

    BlogName = Flags['BlogName'] = OptChoose('', Args.BlogName, ReadConf(SiteConf, 'Site', 'BlogName'))
    SiteTagline = Flags['SiteTagline'] = OptChoose('', Args.SiteTagline, ReadConf(SiteConf, 'Site', 'Tagline'))
    SiteTemplate = Flags['SiteTemplate'] = DefConfOptChoose('SiteTemplate', Args.SiteTemplate, ReadConf(SiteConf, 'Site', 'Template'))
    SiteDomain = Flags['SiteDomain'] = OptChoose('', Args.SiteDomain, ReadConf(SiteConf, 'Site', 'Domain'))
    SiteRoot = Flags['SiteRoot'] = OptChoose('/', Args.SiteRoot, ReadConf(SiteConf, 'Site', 'Root'))
    SiteLang = Flags['SiteLang'] = DefConfOptChoose('SiteLang', Args.SiteLanguage, ReadConf(SiteConf, 'Site', 'Language'))

    # Dict-valued options arrive as Python literals in string form.
    Sorting = Flags['Sorting'] = literal_eval(OptChoose('{}', Args.Sorting, ReadConf(SiteConf, 'Site', 'Sorting')))
    Sorting = Flags['Sorting'] = SetSorting(Sorting)

    NoScripts = Flags['NoScripts'] = StrBoolChoose(False, Args.NoScripts, ReadConf(SiteConf, 'Site', 'NoScripts'))
    FolderRoots = Flags['FolderRoots'] = literal_eval(Args.FolderRoots) if Args.FolderRoots else {}

    ActivityPubTypeFilter = Flags['ActivityPubTypeFilter'] = DefConfOptChoose('ActivityPubTypeFilter', Args.ActivityPubTypeFilter, ReadConf(SiteConf, 'ActivityPub', 'TypeFilter'))
    ActivityPubHoursLimit = Flags['ActivityPubHoursLimit'] = DefConfOptChoose('ActivityPubHoursLimit', Args.ActivityPubHoursLimit, ReadConf(SiteConf, 'ActivityPub', 'HoursLimit'))

    MastodonURL = Flags['MastodonURL'] = OptChoose('', Args.MastodonURL, ReadConf(SiteConf, 'Mastodon', 'URL'))
    MastodonToken = Flags['MastodonToken'] = OptChoose('', Args.MastodonToken, ReadConf(SiteConf, 'Mastodon', 'Token'))

    MarkdownExts = Flags['MarkdownExts'] = literal_eval(OptionChoose(str(MarkdownExtsDefault), Args.MarkdownExts, ReadConf(SiteConf, 'Markdown', 'Exts')))
    SitemapOutput = Flags['SitemapOutput'] = StrBoolChoose(True, Args.SitemapOutput, ReadConf(SiteConf, 'Sitemap', 'Output'))

    MinifyOutput = Flags['MinifyOutput'] = StrBoolChoose(False, Args.MinifyOutput, ReadConf(SiteConf, 'Minify', 'Output'))
    MinifyAssets = Flags['MinifyAssets'] = StrBoolChoose(False, Args.MinifyAssets, ReadConf(SiteConf, 'Minify', 'Assets'))
    MinifyKeepComments = Flags['MinifyKeepComments'] = StrBoolChoose(False, Args.MinifyKeepComments, ReadConf(SiteConf, 'Minify', 'KeepComments'))

    ImgAltToTitle = Flags['ImgAltToTitle'] = StrBoolChoose(True, Args.ImgAltToTitle, ReadConf(SiteConf, 'Site', 'ImgAltToTitle'))
    ImgTitleToAlt = Flags['ImgTitleToAlt'] = StrBoolChoose(False, Args.ImgTitleToAlt, ReadConf(SiteConf, 'Site', 'ImgTitleToAlt'))
    HTMLFixPre = Flags['HTMLFixPre'] = StrBoolChoose(False, Args.HTMLFixPre, ReadConf(SiteConf, 'Site', 'HTMLFixPre'))

    CategoriesAutomatic = Flags['CategoriesAutomatic'] = StrBoolChoose(False, Args.CategoriesAutomatic, ReadConf(SiteConf, 'Categories', 'Automatic'))
    CategoriesUncategorized = Flags['CategoriesUncategorized'] = DefConfOptChoose('CategoriesUncategorized', Args.CategoriesUncategorized, ReadConf(SiteConf, 'Categories', 'Uncategorized'))

    GemtextOutput = Flags['GemtextOutput'] = StrBoolChoose(False, Args.GemtextOutput, ReadConf(SiteConf, 'Gemtext', 'Output'))
    # Precedence: command line, then Site.ini, then a heading made from the
    # site name, then an empty header.
    GemtextHeader = Flags['GemtextHeader'] = Args.GemtextHeader if Args.GemtextHeader else ReadConf(SiteConf, 'Gemtext', 'Header') if ReadConf(SiteConf, 'Gemtext', 'Header') else f"# {SiteName}\n\n" if SiteName else ''

    FeedCategoryFilter = Flags['FeedCategoryFilter'] = DefConfOptChoose('FeedCategoryFilter', Args.FeedCategoryFilter, ReadConf(SiteConf, 'Feed', 'CategoryFilter'))
    # An explicit value (including 0) from the caller wins; 'Default' defers
    # to Site.ini and then to the built-in default.
    FeedEntries = Flags['FeedEntries'] = int(FeedEntries) if (FeedEntries or FeedEntries == 0) and FeedEntries != 'Default' else int(ReadConf(SiteConf, 'Feed', 'Entries')) if ReadConf(SiteConf, 'Feed', 'Entries') else DefConf['FeedEntries']

    JournalRedirect = Flags["JournalRedirect"] = StrBoolChoose(DefConf["JournalRedirect"], Args.JournalRedirect, ReadConf(SiteConf, 'Journal', 'Redirect'))

    DynamicParts = Flags['DynamicParts'] = literal_eval(OptionChoose('{}', Args.DynamicParts, ReadConf(SiteConf, 'Site', 'DynamicParts')))
    DynamicPartsText = Snippets['DynamicParts'] = LoadFromDir('DynamicParts', ['*.htm', '*.html'])
    StaticPartsText = Snippets['StaticParts'] = LoadFromDir('StaticParts', ['*.htm', '*.html'])
    TemplatesText = Snippets['Templates'] = LoadFromDir('Templates', ['*.htm', '*.html'])

    MenuEntries = ReadConf(SiteConf, 'Menu')
    if MenuEntries:
        ConfMenu = GetConfMenu(MenuEntries, MarkdownExts)
    else:
        ConfMenu = []

    # URLs below are built as SiteDomain + '/' + path.
    SiteDomain = Flags['SiteDomain'] = SiteDomain.removesuffix('/')
    Locale = LoadLocale(SiteLang)

    if DiffBuild:
        logging.info("Build mode: Differential")
        LimitFiles = GetModifiedFiles(OutDir)
    else:
        logging.info("Build mode: Clean")
        ResetOutDir(OutDir)
        LimitFiles = False

    if os.path.isdir('Pages'):
        HavePages = True
        shutil.copytree('Pages', OutDir, dirs_exist_ok=True)
        if Flags['GemtextOutput']:
            shutil.copytree('Pages', f"{OutDir}.gmi", ignore=IgnoreFiles, dirs_exist_ok=True)
    if os.path.isdir('Posts'):
        HavePosts = True
        shutil.copytree('Posts', f"{OutDir}/Posts", dirs_exist_ok=True)
        if Flags['GemtextOutput']:
            shutil.copytree('Posts', f"{OutDir}.gmi/Posts", ignore=IgnoreFiles, dirs_exist_ok=True)

    if not (HavePages or HavePosts):
        logging.error("⛔ No Pages or posts found. Nothing to do, exiting!")
        # Equivalent to the interactive-only `exit()` helper, but does not
        # depend on the `site` module being loaded.
        raise SystemExit(1)

    logging.info("Generating HTML")
    Pages = MakeSite(
        Flags=Flags,
        LimitFiles=LimitFiles,
        Snippets=Snippets,
        ConfMenu=ConfMenu,
        GlobalMacros=ReadConf(SiteConf, 'Macros'),
        Locale=Locale,
        Threads=Threads)

    if FeedEntries != 0:
        logging.info("Generating Feeds")
        for FeedType in (True, False):
            MakeFeed(Flags, Pages, FeedType)

    if ActivityPub and MastodonURL and MastodonToken and SiteDomain:
        logging.info("Mastodon Stuff")
        MastodonPosts = MastodonShare(Flags, Pages, Locale)
    else:
        MastodonPosts = []

    # Replace the comments placeholder of every generated page with a
    # comments block linking to its Mastodon post, or with nothing.
    for File, Content, Titles, Meta, ContentHTML, SlimHTML, Description, Image in Pages:
        if IsLightRun(File, LimitFiles):
            continue
        File = f"{OutDir}/{StripExt(File)}.html"
        Content = ReadFile(File)
        Post = ''
        for p in MastodonPosts:
            if p['Link'] == SiteDomain + '/' + File[len(f"{OutDir}/"):]:
                Post = HTMLCommentsBlock.format(
                    StrComments=Locale['Comments'],
                    StrOpen=Locale['OpenInNewTab'],
                    URL=p['Post'])
                break
        Content = ReplWithEsc(Content, '[staticoso:Comments]', Post)
        Content = ReplWithEsc(Content, '<staticoso:Comments>', Post)
        WriteFile(File, Content)
        FinalPaths += [File]

    logging.debug("Creating Redirects")
    WriteRedirects(Flags, Pages, FinalPaths, Locale)

    if Flags['GemtextOutput']:
        logging.info("Generating Gemtext")
        GemtextCompileList(Flags, Pages, LimitFiles)

    logging.info("Cleaning Temporary Files")
    DelTmp(OutDir)

    if Flags['SitemapOutput']:
        logging.info("Generating Sitemap")
        MakeSitemap(Flags, Pages)

    # 'Assets' is optional, like 'Pages' and 'Posts': without this guard a
    # site with no assets crashed with FileNotFoundError at the very end of
    # an otherwise successful build.
    if os.path.isdir('Assets'):
        logging.info("Preparing Assets")
        #os.system(f"cp -R Assets/* {OutDir}/")
        if Flags['MinifyAssets']:
            # NOTE(review): IgnoreFiles presumably makes copytree recreate
            # only the directory structure — confirm in Modules.Utils. Files
            # are then written one by one below.
            shutil.copytree('Assets', OutDir, ignore=IgnoreFiles, dirs_exist_ok=True)
            for File in Path('Assets').rglob('*'):
                if os.path.isfile(File):
                    Dest = f"{OutDir}/{str(File)[len('Assets')+1:]}"
                    if str(File).lower().endswith(FileExtensions['HTML']):
                        WriteFile(Dest, DoMinifyHTML(ReadFile(File), MinifyKeepComments))
                    elif str(File).lower().endswith('.css'):
                        WriteFile(Dest, cssmin(ReadFile(File), MinifyKeepComments))
                    else:
                        shutil.copy2(File, Dest)
        else:
            shutil.copytree('Assets', OutDir, dirs_exist_ok=True)
2022-07-11 17:28:59 +02:00
#def DoSiteBuild(Arg=None):
# #try:
# # SiteEditObserver.stop()
# # SiteEditObserver.join()
# #except:
# # pass
# Main(Args=Args, FeedEntries=FeedEntries)
# logging.info(f"✅ Done! ({round(time.time()-StartTime, 3)}s)")
# #SiteEditObserver.start()
2022-05-16 20:12:06 +02:00
# Script entry point: parse the command line, set up logging, probe the
# optional feed dependencies, then run a single build and report its duration.
if __name__ == '__main__':
    StartTime = time.time()

    # Nearly every option is taken as a string; Main() converts it and
    # merges it with Site.ini and the built-in defaults.
    Parser = argparse.ArgumentParser()
    Parser.add_argument('--Logging', type=str) # Levels: Debug, Info, Warning, Error.
    Parser.add_argument('--Threads', type=str) # Set 0 to use all CPU cores
    Parser.add_argument('--DiffBuild', type=str)
    Parser.add_argument('--OutputDir', type=str)
    #Parser.add_argument('--InputDir', type=str)
    Parser.add_argument('--Sorting', type=str)
    Parser.add_argument('--SiteLang', type=str) # DEPRECATED
    Parser.add_argument('--SiteLanguage', type=str)
    Parser.add_argument('--SiteRoot', type=str)
    Parser.add_argument('--SiteName', type=str)
    Parser.add_argument('--BlogName', type=str)
    Parser.add_argument('--SiteTemplate', type=str)
    Parser.add_argument('--SiteDomain', type=str)
    Parser.add_argument('--MinifyOutput', type=str)
    Parser.add_argument('--MinifyAssets', type=str)
    Parser.add_argument('--MinifyKeepComments', type=str)
    Parser.add_argument('--NoScripts', type=str)
    Parser.add_argument('--ImgAltToTitle', type=str)
    Parser.add_argument('--ImgTitleToAlt', type=str)
    Parser.add_argument('--HTMLFixPre', type=str)
    Parser.add_argument('--GemtextOutput', type=str)
    Parser.add_argument('--GemtextHeader', type=str)
    Parser.add_argument('--SiteTagline', type=str)
    Parser.add_argument('--SitemapOutput', type=str)
    Parser.add_argument('--JournalRedirect', type=str)
    Parser.add_argument('--FeedEntries', type=str)
    Parser.add_argument('--FolderRoots', type=str)
    Parser.add_argument('--DynamicParts', type=str)
    Parser.add_argument('--MarkdownExts', type=str)
    Parser.add_argument('--MastodonURL', type=str)
    Parser.add_argument('--MastodonToken', type=str)
    Parser.add_argument('--FeedCategoryFilter', type=str)
    Parser.add_argument('--ActivityPubTypeFilter', type=str, help=argparse.SUPPRESS)
    Parser.add_argument('--ActivityPubHoursLimit', type=int)
    Parser.add_argument('--CategoriesAutomatic', type=str)
    Parser.add_argument('--CategoriesUncategorized', type=str)
    Args = Parser.parse_args()

    ConfigLogging(Args.Logging)

    # Feed generation is optional: it is disabled (FeedEntries = 0) when
    # lxml or the Feed module cannot be loaded.
    try:
        import lxml
        from Modules.Feed import *
    except Exception:
        # `Exception` rather than a bare `except:` so that KeyboardInterrupt
        # and SystemExit are not swallowed during the import.
        logging.warning("⚠ Can't load the XML libraries. XML Feeds Generation is Disabled. Make sure the 'lxml' library is installed.")
        FeedEntries = 0
    else:
        FeedEntries = Args.FeedEntries if Args.FeedEntries else 'Default'

    #from watchdog.observers import Observer
    #from watchdog.events import LoggingEventHandler
    #SiteEditEvent = LoggingEventHandler()
    #SiteEditEvent.on_created = DoSiteBuild
    #SiteEditEvent.on_deleted = DoSiteBuild
    #SiteEditEvent.on_modified = DoSiteBuild
    #SiteEditEvent.on_moved = DoSiteBuild
    #SiteEditObserver = Observer()
    #SiteEditObserver.schedule(SiteEditEvent, ".", recursive=True)
    #SiteEditObserver.start()

    Main(Args=Args, FeedEntries=FeedEntries)
    logging.info(f"✅ Done! ({round(time.time()-StartTime, 3)}s)")

    #DoSiteBuild()
    #try:
    #    while True:
    #        pass
    #except KeyboardInterrupt:
    #    logging.info("Stopped.")
    #finally:
    #    SiteEditObserver.stop()
    #    SiteEditObserver.join()