1. 一般来说,是的。
2. 我不知道如何合并多个HTML文件,但是这里有一个Python脚本(Github),可以将CSS / JS /图像合并到一个单独的HTML文件中。与Noam Nol的回答相比...
- ... 它没有外部依赖
- ... 它还会正确处理非PNG图像。
用法: python3 htmlmerger yourfile.html
Github上的代码:htmlmerger.py
以下是Github文件的内容。
import base64
import html
import mimetypes
import os
import sys
from html.parser import HTMLParser
# Usage text; main() prints it when no input file is given on the command line.
gHelp = """
Merge JS/CSS/images/HTML into one single file
Version: 1.0
Usage:
htmlmerger inputfile [optional: outputfile]
"""
def getFileContent (strFilepath):
    """Return the complete text of the file at `strFilepath`.

    The file is opened in text mode without an explicit encoding, so it is
    decoded with the platform's default encoding.
    """
    with open (strFilepath, "r") as textFile:
        return textFile.read ()
def getFileContentBytes (strFilepath):
    """Return the raw bytes of the file at `strFilepath`, read in binary mode."""
    with open (strFilepath, "rb") as binaryFile:
        return binaryFile.read ()
class HtmlMerger(HTMLParser):
    """
    Re-emit an HTML document with its local resources embedded inline.

    Call "run(htmlContent, basedir)" to merge the stylesheets, scripts and
    images referenced within htmlContent into one single HTML string:

    - `<link rel="stylesheet" href=...>` becomes `<style>...</style>`
    - `<script src=...>` gets the file content as its inline body
    - `<img src=...>` gets a base64 `data:` URI

    A reference that cannot be resolved to a file below `basedir` is reported
    in `self.messages` and written back unchanged, so the output still points
    at the original resource. Everything else (doctype, comments, processing
    instructions, text, other tags) is written back as parsed.
    """

    # Elements whose text the parser hands over verbatim (never
    # entity-decoded); it must be written back without escaping.
    _RAW_TEXT_TAGS = ("script", "style")

    def __init__(self):
        # Text and attribute values arrive entity-decoded; they are
        # re-escaped on output (see handle_data / _renderAttribute).
        super().__init__(convert_charrefs=True)
        self._result = ""
        self._additionalData = ""   # script content waiting for its end tag
        self._baseDir = ""
        self._inRawText = False     # True while inside <script>/<style>
        self.messages = []

    def _addMessage_fileNotFound(self, file_asInHtmlFile, file_searchpath):
        """Record that a referenced file was not found at the searched path."""
        self.messages.append("Error: Line " + str(self.getpos()[0]) +
                             ": Could not find file `" + str(file_asInHtmlFile) +
                             "`; searched in `" + str(file_searchpath) + "`.")

    def _getAttribute(self, attributes, attributeName):
        """Return the attribute value, or `None` if the attribute is absent."""
        for key, value in attributes:
            if key == attributeName:
                return value
        return None

    def _getFullFilepath(self, relPath):
        """Resolve a path from the HTML file against the base directory."""
        return os.path.join(self._baseDir, relPath)

    def _renderAttribute(self, key, value):
        """Return one attribute as HTML source text."""
        if value is None:
            # Boolean attribute such as `disabled` or `async`.
            return key
        return key + '="' + html.escape(value, quote=True) + '"'

    def _inlineStylesheet(self, attrs):
        """Write a `<style>` element for a stylesheet link; return True if done."""
        href = self._getAttribute(attrs, "href")
        rel = self._getAttribute(attrs, "rel") or ""
        # Only stylesheets can become <style>; icons, canonical links etc.
        # must stay as ordinary <link> tags.
        if not href or "stylesheet" not in rel.lower().split():
            return False
        hrefFullPath = self._getFullFilepath(href)
        if not os.path.isfile(hrefFullPath):
            self._addMessage_fileNotFound(href, hrefFullPath)
            return False
        self._result += "<style>" + getFileContent(hrefFullPath) + "</style>"
        return True

    def _queueScript(self, src):
        """Queue a script file's content for inlining; return True if found."""
        scriptPath = self._getFullFilepath(src)
        if not os.path.isfile(scriptPath):
            self._addMessage_fileNotFound(src, scriptPath)
            return False
        self._additionalData += getFileContent(scriptPath)
        return True

    def _imageDataUri(self, src):
        """Return a base64 `data:` URI for an image file, or `None` if missing."""
        imgPathFull = self._getFullFilepath(src)
        if not os.path.isfile(imgPathFull):
            self._addMessage_fileNotFound(src, imgPathFull)
            return None
        mimeType = mimetypes.guess_type(imgPathFull)[0]
        if mimeType is None:
            # Unknown extension: fall back to "image/<extension>".
            mimeType = "image/" + os.path.splitext(src)[1][1:]
        encoded = base64.b64encode(getFileContentBytes(imgPathFull))
        return "data:" + mimeType + ";base64," + encoded.decode("ascii")

    def _writeStartTag(self, tag, attrs, selfClosing):
        """Write a start tag, inlining the resource it references if possible."""
        if tag == "link" and self._inlineStylesheet(attrs):
            return
        parts = [tag]
        for key, value in attrs:
            if key == "src" and value:
                if tag == "script" and self._queueScript(value):
                    # The content is written before the end tag instead.
                    continue
                if tag == "img":
                    dataUri = self._imageDataUri(value)
                    if dataUri is not None:
                        value = dataUri
            parts.append(self._renderAttribute(key, value))
        # A self-closed tag with queued script content needs a real end tag,
        # which handle_startendtag adds.
        if selfClosing and not self._additionalData:
            closer = "/>"
        else:
            closer = ">"
        self._result += "<" + " ".join(parts) + closer

    def handle_starttag(self, tag, attrs):
        self._writeStartTag(tag, attrs, False)
        if tag in self._RAW_TEXT_TAGS:
            self._inRawText = True

    def handle_startendtag(self, tag, attrs):
        # Keep `<br/>`-style tags self-closed instead of adding `</br>`.
        self._writeStartTag(tag, attrs, True)
        if self._additionalData:
            self.handle_endtag(tag)

    def _writeAndResetAdditionalData(self):
        """Flush queued script content into the result."""
        self._result += self._additionalData
        self._additionalData = ""

    def handle_endtag(self, tag):
        self._writeAndResetAdditionalData()
        self._result += "</" + tag + ">"
        if tag in self._RAW_TEXT_TAGS:
            self._inRawText = False

    def handle_data(self, data):
        if self._inRawText:
            self._result += data
        else:
            # Text was entity-decoded by the parser; escape it again so that
            # e.g. `&lt;` does not turn into a literal `<` in the output.
            self._result += html.escape(data, quote=False)

    def handle_comment(self, data):
        self._result += "<!--" + data + "-->"

    def handle_decl(self, decl):
        self._result += "<!" + decl + ">"

    def handle_pi(self, data):
        self._result += "<?" + data + ">"

    def run(self, content, basedir):
        """Merge `content`, resolving references against `basedir`.

        Every call starts from a clean state, so an instance can be reused;
        `self.messages` then holds the problems of the latest call only.
        Returns the merged HTML as a string.
        """
        self.reset()
        self._result = ""
        self._additionalData = ""
        self._inRawText = False
        self.messages = []
        self._baseDir = basedir
        self.feed(content)
        # Flush whatever the parser is still buffering.
        self.close()
        return self._result
def merge(strInfile, strOutfile):
    """Merge the resources referenced by `strInfile` into `strOutfile`.

    Prints a fatal error and returns without writing anything when
    `strInfile` is not an existing file. Otherwise the input is run through
    `HtmlMerger` with the input file's directory as base directory, any
    problems the parser recorded are printed, and the merged HTML is written
    to `strOutfile`.
    """
    if not os.path.isfile(strInfile):
        print("FATAL ERROR: file `" + strInfile + "` could not be accessed.")
        return

    # Relative references in the HTML are resolved against the input's folder.
    baseDir = os.path.dirname(os.path.abspath(strInfile))
    content = getFileContent(strInfile)

    parser = HtmlMerger()
    content_changed = parser.run(content, baseDir)

    if parser.messages:
        print("Problems occured")
        for msg in parser.messages:
            print(" " + msg)
        print("")

    # Written in text mode with the platform default encoding, mirroring how
    # getFileContent reads its input.
    with open(strOutfile, "w") as outFile:
        outFile.write(content_changed)
def main():
    """Command-line entry point: `htmlmerger inputfile [outputfile]`.

    Without arguments the usage text is printed and the process exits.
    The output file defaults to the input name with its extension replaced
    by `_merged.html`. An existing output file is never overwritten; in
    that case a fatal error is printed and the process exits with status 1.
    """
    args = sys.argv[1:]
    if not args:
        print(gHelp)
        sys.exit()

    inputFile = args[0]
    if len(args) > 1:
        outputFile = args[1]
    else:
        outputFile = os.path.splitext(inputFile)[0] + "_merged.html"

    if os.path.isfile(outputFile):
        print("FATAL ERROR: Output file " + outputFile + " does already exist")
        # sys.exit rather than the site-provided exit(), with a non-zero
        # status so that calling scripts can detect the failure.
        sys.exit(1)

    merge(inputFile, outputFile)
# Run the command-line interface only when executed as a script, so the
# module can be imported (e.g. to reuse HtmlMerger) without side effects.
if __name__ == "__main__":
    main()
应将<style>放在<head>中,而将<script>放在结尾位置(但仍在<body>内部)。 - marcellothearcane