Step 1: run so-splitter-Posts.py (config: srcPath, dstPath, tagsPattern)
Step 2: run so-splitter-PostLinks.py (config: srcPath, dstPath)
import mammoth | |
from zipfile import BadZipFile | |
import os | |
# Hard-coded, Windows-style directory paths (drive letter E:).
# NOTE(review): presumably `path` is where the input .docx files live and
# `html_path` is where converted HTML is written — confirm against the code
# that consumes these names.
path = 'E:/dc/data/docx'
html_path = 'E:/dc/data/html'
def gci(filepath): | |
files = os.listdir(filepath) | |
for fi in files: |
Step 1: run so-splitter-Posts.py (config: srcPath, dstPath, tagsPattern)
Step 2: run so-splitter-PostLinks.py (config: srcPath, dstPath)