Skip to content

Commit e13773d

Browse files
committedJun 19, 2014
Fix chapter links when exporting XML.
1 parent 604b1e7 commit e13773d

File tree

4 files changed

+82
-5
lines changed

4 files changed

+82
-5
lines changed
 

‎.gitignore

+3-1
Original file line numberDiff line numberDiff line change
@@ -3,4 +3,6 @@ code/flyweight/tiles/Build/
33
.sass-cache/
44
xcuserdata/
55
*.xcuserstate
6-
project.xcworkspace/
6+
project.xcworkspace/
7+
8+
xml/

‎asset/template.xml

+16
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,16 @@
1+
<?xml version="1.0" standalone="yes" ?>
2+
<!DOCTYPE chapter [
3+
<!ENTITY mdash "&#8212;"> <!-- em dash, U+2014 ISOpub -->
4+
<!ENTITY lsquo "&#8216;"> <!-- left single quotation mark,
5+
U+2018 ISOnum -->
6+
<!ENTITY rsquo "&#8217;"> <!-- right single quotation mark,
7+
U+2019 ISOnum -->
8+
<!ENTITY sbquo "&#8218;"> <!-- single low-9 quotation mark, U+201A NEW -->
9+
<!ENTITY ldquo "&#8220;"> <!-- left double quotation mark,
10+
U+201C ISOnum -->
11+
<!ENTITY rdquo "&#8221;"> <!-- right double quotation mark,
12+
U+201D ISOnum -->
13+
]>
14+
<chapter>
15+
{{body}}
16+
</chapter>

‎note/print workflow.txt

+19
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,19 @@
1+
- Export to XML
2+
- Import XML
3+
- Place it in main text flow
4+
- Untag everything and remove the story structure
5+
- Pull out asides and restyle
6+
- Change first paragraph body text styles
7+
- Set chapter title and number on first page
8+
- Update section in running footer
9+
- Clean up
10+
- Make sure there aren't bits of 14.4pt line height
11+
- Fix prose references to hyperlinks to make them make sense
12+
- Add illustrations
13+
- Make 600 dpi bitmap
14+
- Save to Print/Illustrations/...
15+
- Place
16+
- Make inline anchor
17+
- Set Position to "Above Line" with 9pts of space before and 4.5pts after
18+
- Add a caption
19+
- Position asides

‎script/format.py

+44-4
Original file line numberDiff line numberDiff line change
@@ -51,6 +51,32 @@
5151
"Spatial Partition"
5252
]
5353

54+
# URLs for hyperlinks to chapters. Note that the order is significant here.
55+
# The index in this list + 1 is the chapter's number in the table of contents.
56+
CHAPTER_HREFS = [
57+
"introduction.html",
58+
"architecture-performance-and-games.html",
59+
"command.html",
60+
"flyweight.html",
61+
"observer.html",
62+
"prototype.html",
63+
"singleton.html",
64+
"state.html",
65+
"double-buffer.html",
66+
"game-loop.html",
67+
"update-method.html",
68+
"bytecode.html",
69+
"subclass-sandbox.html",
70+
"type-object.html",
71+
"component.html",
72+
"event-queue.html",
73+
"service-locator.html",
74+
"data-locality.html",
75+
"dirty-flag.html",
76+
"object-pool.html",
77+
"spatial-partition.html"
78+
]
79+
5480
num_chapters = 0
5581
empty_chapters = 0
5682
total_words = 0
@@ -121,7 +147,7 @@ def format_file(path, nav, skip_up_to_date):
121147
else:
122148
print "UNKNOWN COMMAND:", command, args
123149

124-
elif stripped.startswith('#'):
150+
elif extension != "xml" and stripped.startswith('#'):
125151
# Build the page navigation from the headers.
126152
index = stripped.find(" ")
127153
headertype = stripped[:index]
@@ -230,10 +256,24 @@ def clean_up_code_xml(code):
230256

231257
return code
232258

259+
def fix_link(match):
260+
tag = match.group(1)
261+
contents = match.group(2)
262+
href = re.search(r'href\s*=\s*"([^"]+)"', tag).group(1)
263+
264+
# If it's not a link to a chapter, just return the contents of the link and
265+
# strip out the link itself.
266+
if not href in CHAPTER_HREFS:
267+
return contents
268+
269+
# Turn it into a chapter number reference.
270+
return "{}<chap-ref> ({})</chap-ref>".format(
271+
contents, CHAPTER_HREFS.index(href) + 1)
272+
233273
def clean_up_xhtml(html):
234-
# Remove links.
235-
html = re.sub(r"<a\s[^>]+>", "", html)
236-
html = re.sub(r"</a>", "", html)
274+
# Replace chapter links with chapter number references and remove other
275+
# links.
276+
html = re.sub(r"<a\s+([^>]+)>([^<]+)</a>", fix_link, html)
237277

238278
# Ditch newlines in the middle of blocks of text. Out of sheer malice,
239279
# even though they are meaningless in actual XML, InDesign treats them

0 commit comments

Comments
 (0)
Please sign in to comment.