third_party/Python-Markdown/markdown/treeprocessors.py - Issue 1389543003: Revert of Check in a simple pure-python based Markdown previewer.

Side by Side Diff: third_party/Python-Markdown/markdown/treeprocessors.py

Issue 1389543003: Revert of Check in a simple pure-python based Markdown previewer. (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@add

Patch Set: Created 5 years, 2 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch

OLD	NEW
	(Empty)
1 from __future__ import unicode_literals

2 from __future__ import absolute_import

3 from . import util

4 from . import odict

5 from . import inlinepatterns

6

7

def build_treeprocessors(md_instance, **kwargs):
    """
    Create the default, ordered collection of treeprocessors.

    Keyword arguments:

    * md_instance: the Markdown instance handed to every treeprocessor.
    * kwargs: accepted for call compatibility; not used here.

    Returns: an `odict.OrderedDict` holding the "inline" processor
    followed by the "prettify" processor.

    """
    defaults = (
        ("inline", InlineProcessor),
        ("prettify", PrettifyTreeprocessor),
    )
    registry = odict.OrderedDict()
    for key, processor_class in defaults:
        registry[key] = processor_class(md_instance)
    return registry

14

15

def isString(s):
    """
    Tell whether `s` is a plain (non-atomic) string.

    Returns False for any `util.AtomicString` instance, otherwise True
    only when `s` is an instance of `util.string_type`.
    """
    if isinstance(s, util.AtomicString):
        return False
    return isinstance(s, util.string_type)

21

22

class Treeprocessor(util.Processor):
    """
    Base class for processors that operate on the ElementTree object
    before it is serialized.

    A Treeprocessor provides a "run" method that receives an ElementTree,
    changes it as required and hands back an ElementTree object.

    Every treeprocessor must extend markdown.Treeprocessor.

    """
    def run(self, root):
        """
        Hook to be overridden by subclasses.

        * root: the root ElementTree.

        An implementation may return a different ElementTree object, in
        which case the existing root is replaced, or it may modify the
        tree in place and return None. This base version does nothing.
        """
        return None  # pragma: no cover

42

43

class InlineProcessor(Treeprocessor):
    """
    A Treeprocessor that walks a tree and applies the inline patterns.

    Elements produced by the patterns are parked in `self.stashed_nodes`
    and represented in the text by placeholder strings; the placeholders
    are later swapped back for the stashed elements.
    """

    def __init__(self, md):
        prefix = util.INLINE_PLACEHOLDER_PREFIX
        suffix = util.ETX
        self.__placeholder_prefix = prefix
        self.__placeholder_suffix = suffix
        # The 4 matches the width of the "%04d" id used for placeholders.
        self.__placeholder_length = 4 + len(prefix) + len(suffix)
        self.__placeholder_re = util.INLINE_PLACEHOLDER_RE
        self.markdown = md
        self.inlinePatterns = md.inlinePatterns

    def __makePlaceholder(self, type):
        """
        Build the next placeholder.

        The id is the current size of the stash, zero padded to four
        digits. `type` is accepted but not used.

        Returns: tuple of (placeholder string, id).
        """
        node_id = "%04d" % len(self.stashed_nodes)
        return util.INLINE_PLACEHOLDER % node_id, node_id

    def __findPlaceholder(self, data, index):
        """
        Look for a placeholder in `data`, searching from `index`.

        Keyword arguments:

        * data: string
        * index: position at which the search starts

        Returns: (placeholder id, index just past the placeholder) when one
        is found, otherwise (None, index + 1).

        """
        found = self.__placeholder_re.search(data, index)
        if not found:
            return None, index + 1
        return found.group(1), found.end()

    def __stashNode(self, node, type):
        """ Store `node` in the stash and return its placeholder string. """
        placeholder, node_id = self.__makePlaceholder(type)
        self.stashed_nodes[node_id] = node
        return placeholder

    def __handleInline(self, data, patternIndex=0):
        """
        Run the inline patterns over a string, replacing matches with
        placeholders.

        Keyword arguments:

        * data: A line of Markdown text
        * patternIndex: The index of the inlinePattern to start with

        Returns: String with placeholders. An AtomicString is returned
        untouched.

        """
        if isinstance(data, util.AtomicString):
            return data

        startIndex = 0
        while patternIndex < len(self.inlinePatterns):
            current_pattern = self.inlinePatterns.value_for_index(patternIndex)
            data, matched, startIndex = self.__applyPattern(
                current_pattern, data, patternIndex, startIndex
            )
            # Stay on the same pattern for as long as it keeps matching.
            if not matched:
                patternIndex += 1
        return data

    def __processElementText(self, node, subnode, isText=True):
        """
        Resolve placeholders found in the text or tail of an Element that
        came out of self.stashed_nodes.

        Keywords arguments:

        * node: parent node
        * subnode: processing node
        * isText: True to process subnode.text, False for subnode.tail

        Returns: None

        """
        attr_name = "text" if isText else "tail"
        raw = getattr(subnode, attr_name)
        setattr(subnode, attr_name, None)

        produced = self.__processPlaceholders(raw, subnode, isText)

        if isText or node is subnode:
            insert_at = 0
        else:
            insert_at = list(node).index(subnode) + 1

        # Inserting in reverse at a fixed position keeps the original order.
        for new_child in reversed(produced):
            node.insert(insert_at, new_child)

    def __processPlaceholders(self, data, parent, isText=True):
        """
        Turn a string containing placeholders into ElementTree elements.

        Keyword arguments:

        * data: string with placeholders instead of ElementTree elements.
        * parent: Element, which contains processing inline data
        * isText: when no element has been produced yet, leading text is
          appended to parent.text if True and to parent.tail if False

        Returns: list with ElementTree elements with applied inline patterns.

        """
        result = []

        def linkText(text):
            # Attach text to the tail of the last produced element, or to
            # the parent's tail/text when nothing has been produced yet.
            if not text:
                return
            if result:
                target, attr_name = result[-1], "tail"
            elif not isText:
                target, attr_name = parent, "tail"
            else:
                target, attr_name = parent, "text"
            existing = getattr(target, attr_name)
            if existing:
                setattr(target, attr_name, existing + text)
            else:
                setattr(target, attr_name, text)

        prefix = self.__placeholder_prefix
        cursor = 0
        while data:
            index = data.find(prefix, cursor)

            if index == -1:
                # No more placeholders: flush what is left and finish.
                remainder = data[cursor:]
                if isinstance(data, util.AtomicString):
                    # We don't want to lose the AtomicString
                    remainder = util.AtomicString(remainder)
                linkText(remainder)
                break

            node_id, placeholder_end = self.__findPlaceholder(data, index)

            if node_id not in self.stashed_nodes:
                # wrong placeholder: emit the prefix as ordinary text
                prefix_end = index + len(prefix)
                linkText(data[cursor:prefix_end])
                cursor = prefix_end
                continue

            node = self.stashed_nodes.get(node_id)

            if index > 0:
                linkText(data[cursor:index])

            if isString(node):
                # it's just a string
                linkText(node)
                cursor = placeholder_end
                continue

            # it's an Element: resolve placeholders nested inside it
            for child in [node] + list(node):
                if child.tail and child.tail.strip():
                    self.__processElementText(node, child, False)
                if child.text and child.text.strip():
                    self.__processElementText(child, child)

            cursor = placeholder_end
            result.append(node)

        return result

    def __applyPattern(self, pattern, data, patternIndex, startIndex=0):
        """
        Try one pattern against the text; on a match, build the resulting
        node and add it to stashed_nodes.

        Keyword arguments:

        * data: the text to be processed
        * pattern: the pattern to be checked
        * patternIndex: index of current pattern
        * startIndex: string index, from which we start searching

        Returns: tuple of (text, matched flag, next start index). When a
        node was stashed, the text has a placeholder in place of the match.

        """
        match = pattern.getCompiledRegExp().match(data[startIndex:])
        leftData = data[:startIndex]

        if not match:
            return data, False, 0

        node = pattern.handleMatch(match)

        if node is None:
            # Nothing produced: resume at the start of the last group.
            last_group = len(match.groups())
            return data, True, len(leftData) + match.start(last_group)

        if not isString(node) and \
                not isinstance(node.text, util.AtomicString):
            # We need to process current node too
            for child in [node] + list(node):
                if child.text:
                    child.text = self.__handleInline(
                        child.text, patternIndex + 1
                    )
                if child.tail:
                    child.tail = self.__handleInline(
                        child.tail, patternIndex
                    )

        placeholder = self.__stashNode(node, pattern.type())

        pieces = (leftData, match.group(1), placeholder, match.groups()[-1])
        return "%s%s%s%s" % pieces, True, 0

    def run(self, tree):
        """Apply inline patterns to a parsed Markdown tree.

        Walk the ElementTree, apply the inline patterns to the text and
        tail of the elements found, and insert the newly created Elements
        into the tree. If you don't want a piece of data to be processed
        with inline patterns, use the AtomicString subclass instead of a
        normal string:

            node.text = markdown.AtomicString("This will not be processed.")

        Arguments:

        * tree: ElementTree object, representing Markdown tree.

        Returns: ElementTree object with applied inline patterns.

        """
        self.stashed_nodes = {}

        pending = [tree]

        while pending:
            current = pending.pop()
            deferred = []
            for child in current:
                if child.text and not isinstance(
                    child.text, util.AtomicString
                ):
                    source_text = child.text
                    child.text = None
                    created = self.__processPlaceholders(
                        self.__handleInline(source_text), child
                    )
                    pending.extend(created)
                    deferred.append((child, created))
                if child.tail:
                    processed_tail = self.__handleInline(child.tail)
                    # Throwaway element that collects leftover tail text.
                    scratch = util.etree.Element('d')
                    child.tail = None
                    siblings = self.__processPlaceholders(
                        processed_tail, scratch, False
                    )
                    if scratch.tail:
                        child.tail = scratch.tail
                    insert_at = list(current).index(child) + 1
                    for sibling in reversed(siblings):
                        current.insert(insert_at, sibling)
                if len(child):
                    pending.append(child)

            for element, created in deferred:
                if self.markdown.enable_attributes and element.text \
                        and isString(element.text):
                    element.text = inlinepatterns.handleAttributes(
                        element.text, element
                    )
                for position, new_child in enumerate(created):
                    if self.markdown.enable_attributes:
                        # Processing attributes
                        if new_child.tail and isString(new_child.tail):
                            new_child.tail = inlinepatterns.handleAttributes(
                                new_child.tail, element
                            )
                        if new_child.text and isString(new_child.text):
                            new_child.text = inlinepatterns.handleAttributes(
                                new_child.text, new_child
                            )
                    element.insert(position, new_child)
        return tree

334

335

class PrettifyTreeprocessor(Treeprocessor):
    """ Add linebreaks to the html document. """

    @staticmethod
    def _iterTag(root, tag):
        """
        Iterate over `root` and its descendants that have the given tag.

        Uses `iter()` when the element provides it and falls back to the
        older `getiterator()` otherwise; `getiterator()` no longer exists
        on `xml.etree.ElementTree` elements in Python 3.9+.
        """
        iterate = getattr(root, 'iter', None) or root.getiterator
        return iterate(tag)

    def _prettifyETree(self, elem):
        """
        Recursively add linebreaks to ElementTree children.

        For a block level element other than 'code' and 'pre', the text is
        set to a newline when it is blank and the first child is block
        level, and block level children are processed recursively. In
        every case a missing or whitespace-only tail becomes a newline.
        """
        newline = "\n"
        if util.isBlockLevel(elem.tag) and elem.tag not in ['code', 'pre']:
            if (not elem.text or not elem.text.strip()) \
                    and len(elem) and util.isBlockLevel(elem[0].tag):
                elem.text = newline
            for child in elem:
                if util.isBlockLevel(child.tag):
                    self._prettifyETree(child)
        if not elem.tail or not elem.tail.strip():
            elem.tail = newline

    def run(self, root):
        """
        Add linebreaks to ElementTree root object.

        * root: the root element; it is modified in place.

        Returns: None
        """
        self._prettifyETree(root)
        # Do <br />'s separately as they are often in the middle of
        # inline content and missed by _prettifyETree.
        for br in self._iterTag(root, 'br'):
            if not br.tail or not br.tail.strip():
                br.tail = '\n'
            else:
                br.tail = '\n%s' % br.tail
        # Clean up extra empty lines at end of code blocks.
        for pre in self._iterTag(root, 'pre'):
            if len(pre) and pre[0].tag == 'code':
                code = pre[0]
                # A <code> element without text has nothing to clean up;
                # calling rstrip() on None would raise AttributeError.
                if code.text is not None:
                    code.text = util.AtomicString(code.text.rstrip() + '\n')

OLD	NEW

« no previous file with comments | « third_party/Python-Markdown/markdown/serializers.py ('k') | third_party/Python-Markdown/markdown/util.py » ('j') | no next file with comments »