summaryrefslogtreecommitdiff
path: root/tools/docs/docload.py
diff options
context:
space:
mode:
authorMagnus Hagander2016-11-16 12:00:50 +0000
committerMagnus Hagander2016-11-16 12:00:50 +0000
commitab0ee308818f8d04b8a2bb0d472334598265a004 (patch)
treefb15d4989a27cfadc889f65c63ff8e38f1012204 /tools/docs/docload.py
parentc5d162dee737518c983d81ab95b05b08a496210c (diff)
Support loading docs in utf-8 from pg version 10
Diffstat (limited to 'tools/docs/docload.py')
-rwxr-xr-xtools/docs/docload.py12
1 files changed, 11 insertions, 1 deletions
diff --git a/tools/docs/docload.py b/tools/docs/docload.py
index faf1892e..12b26957 100755
--- a/tools/docs/docload.py
+++ b/tools/docs/docload.py
@@ -29,7 +29,17 @@ def load_doc_file(filename, f):
indent='auto',
)
- contents = unicode(f.read(),'latin1')
+ # Postgres 10 started using an XML toolchain and now produces documentation in UTF-8. So we need
+ # to figure out which version it is.
+ rawcontents = f.read()
+ if rawcontents.startswith('<?xml version="1.0" encoding="UTF-8"'):
+ # Version 10, use utf8
+ encoding = 'utf-8'
+ else:
+ encoding = 'latin1'
+
+ contents = unicode(rawcontents, encoding)
+
tm = re_titlematch.search(contents)
if tm:
title = tm.group(1)