forked from AsteriskAmpersand/Carian-Archive
-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathparser.py
132 lines (121 loc) · 4.11 KB
/
parser.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
# -*- coding: utf-8 -*-
"""
Created on Sun Mar 13 01:33:31 2022
@author: Asterisk
"""
import xml.etree.ElementTree as ET
import markdown
from pathlib import Path
npcOverloads = {}
# def loadNPCNames(root):
# path = str(root / r"NPC名.fmg.xml")
# npcNames = loadTextFile(path)
# remapping = {}
# for ids in npcNames:
# if str(ids)[0] == "1":
# remapping[int(str(ids)[1:-1])] = npcNames[ids]
# for key in npcOverloads:
# remapping[key] = npcOverloads[key]
# return remapping
def parseNPCDialogue(path, npcNames = {},output = print):
l_npc = 0
l_section = 0
l_identifier = 0
data = loadTextFile(path)
for identifier in data:
section = l_section
if identifier != l_identifier + 1:
section = section + 1
npc = (identifier//100000)
if npc != l_npc:
if npc in npcNames:
output("### %s [%04d]"%(npcNames[npc],npc))
else:
output("### %04d"%(npc))
l_npc = npc
l_section = -1
section = 0
if section != l_section:
output("#### Section %02d"%section)
l_section = section
if data[identifier]:
output("[%d] "%(identifier) + data[identifier]+" ")
l_identifier = identifier
return
def loadTextFile(path):
tree = ET.parse(path)
root = tree.getroot()
textElements = list(list(root)[3])
elements = {}
for element in textElements:
identifier = int(element.items()[0][1])
text = element.text
if "%null%" not in text:
elements[identifier] = text
return elements
def pairedTextFiles(path0,path1):
merged = {}
l,r = map(loadTextFile,[path0,path1])
for key in l:
if key in r:
merged[key] = (l[key],r[key])
else:
merged[key] = (l[key],"")
for key in r:
if key not in merged:
merged[key] = ("",r[key])
return merged
def singleTextFiles(path):
l = loadTextFile(path)
m = {}
for key in l:
m[key] = ("",l[key])
return m
def loadFromChunk(chunk):
knownPairs = {"FCS名":"FCS説明", # FCS
"アーカイブ名":"アーカイブ内容", # Logs
"ジェネレーター名":"ジェネレーター説明", # Generator
"チュートリアルタイトル":"チュートリアル本文", # Tutorial
"ブースター名":"ブースター説明", # Booster
"武器名":"武器説明", # Weapon
"防具名":"防具説明", # Parts
}
knownPairs = {k+".fmg":t+".fmg" for k,t in knownPairs.items()}
pairTargets = {knownPairs[p]:p for p in knownPairs}
master = []
# npcIds = loadNPCNames(chunk)
duplicates = set()
for file in chunk.rglob("*.xml"):
if "ToS" in file.stem:
continue
if file.stem in knownPairs:
text = pairedTextFiles(str(file),
str(file).replace(file.stem,
knownPairs[file.stem]))
elif file.stem in pairTargets:
continue
else:
text = singleTextFiles(str(file))
master.append("\n\n## %s\n"%file.stem)
if file.stem == "会話.fmg":
parseNPCDialogue(file, {},master.append)
else:
for key,(title,description) in text.items():
if description in duplicates:
continue
duplicates.add(description)
if title:
master.append("\n### %s [%d]"%(title,key))
master.append(description)
else:
master.append("[%d] %s\n"%(key,description))
text = "\n".join(master)
return text
chunk = Path(r".\GameText")
text = loadFromChunk(chunk)
with open("Master.html","w",encoding = "utf8") as outf:
outf.write(markdown.markdown(text))
chunk = Path(r".\GameTextJP")
text = loadFromChunk(chunk)
with open("MasterJP.html","w",encoding = "utf8") as outf:
outf.write(markdown.markdown(text))