1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
|
# Copyright (C) 2013 Lars Wirzenius
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License along
# with this program; if not, write to the Free Software Foundation, Inc.,
# 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
'''Simplistic text re-formatter.
This module format text, paragraph by paragraph, so it is somewhat
nice-looking, with no line too long, and short lines joined. In
other words, like what the textwrap library does. However, it
extends textwrap by recognising bulleted lists.
'''
import textwrap
class Paragraph(object):
def __init__(self):
self._lines = []
def append(self, line):
self._lines.append(line)
def _oneliner(self):
return ' '.join(' '.join(x.split()) for x in self._lines)
def fill(self, width):
filled = textwrap.fill(self._oneliner(), width=width)
return filled
class BulletPoint(Paragraph):
def fill(self, width):
text = self._oneliner()
assert text.startswith('* ')
filled = textwrap.fill(text[2:], width=width - 2)
lines = [' %s' % x for x in filled.splitlines(True)]
lines[0] = '* %s' % lines[0][2:]
return ''.join(lines)
class EmptyLine(Paragraph):
def fill(self, width):
return ''
class TextFormat(object):
def __init__(self, width=78):
self._width = width
def format(self, text):
'''Return input string, but formatted nicely.'''
filled_paras = []
for para in self._paragraphs(text):
filled_paras.append(para.fill(self._width))
filled = '\n'.join(filled_paras)
if text and not filled.endswith('\n'):
filled += '\n'
return filled
def _paragraphs(self, text):
def is_empty(line):
return line.strip() == ''
def is_bullet(line):
return line.startswith('* ')
def is_continuation(line):
return line.startswith(' ')
current = None
in_list = False
for line in text.splitlines(True):
if in_list and is_continuation(line):
assert current is not None
current.append(line)
elif is_bullet(line):
if current:
yield current
if not in_list:
yield EmptyLine()
current = BulletPoint()
current.append(line)
in_list = True
elif is_empty(line):
if current:
yield current
yield EmptyLine()
current = None
in_list = False
else:
if in_list:
yield current
yield EmptyLine()
current = None
if not current:
current = Paragraph()
current.append(line)
in_list = False
if current:
yield current
|