# test_parser.py (16 KB)
  1. # -*- coding: utf-8 -*-
  2. from __future__ import unicode_literals
  3. from django.contrib.auth import get_user_model
  4. from django.test import TestCase
  5. from misago.markup.parser import parse
  6. UserModel = get_user_model()
  7. class MockRequest(object):
  8. scheme = 'http'
  9. def __init__(self, user=None):
  10. self.user = user
  11. def get_host(self):
  12. return 'test.com'
  13. class MockPoster(object):
  14. username = 'LoremIpsum'
  15. slug = 'loremipsum'
  16. class BBCodeTests(TestCase):
  17. def test_inline_text(self):
  18. """inline elements are correctly parsed"""
  19. test_text = """
  20. Lorem **ipsum**, dolor met.
  21. Lorem [b]ipsum[/b], [i]dolor[/i] [u]met[/u].
  22. Lorem [b]**ipsum**[/b] [i]dolor[/i] [u]met[/u].
  23. Lorem [b]**ipsum[/b]** [i]dolor[/i] [u]met[/u].
  24. Lorem [b]__ipsum[/b]__ [i]dolor[/i] [u]met[/u].
  25. Lorem [b][i]ipsum[/i][/b].
  26. Lorem [b][i]ipsum[/b][/i].
  27. Lorem [b]ipsum[/B].
  28. """.strip()
  29. expected_result = """
  30. <p>Lorem <strong>ipsum</strong>, dolor met.</p>
  31. <p>Lorem <b>ipsum</b>, <i>dolor</i> <u>met</u>.</p>
  32. <p>Lorem <b><strong>ipsum</strong></b> <i>dolor</i> <u>met</u>.</p>
  33. <p>Lorem <b>**ipsum</b>** <i>dolor</i> <u>met</u>.</p>
  34. <p>Lorem <b>__ipsum</b>__ <i>dolor</i> <u>met</u>.</p>
  35. <p>Lorem <b><i>ipsum</i></b>.</p>
  36. <p>Lorem <b>[i]ipsum</b>[/i].</p>
  37. <p>Lorem <b>ipsum</b>.</p>
  38. """.strip()
  39. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  40. self.assertEqual(expected_result, result['parsed_text'])
  41. def test_hr(self):
  42. """hr bbcode is correctly parsed"""
  43. test_text = """
  44. Lorem ipsum.
  45. [hr]
  46. Dolor met.
  47. """.strip()
  48. expected_result = """
  49. <p>Lorem ipsum.</p>
  50. <hr/>
  51. <p>Dolor met.</p>
  52. """.strip()
  53. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  54. self.assertEqual(expected_result, result['parsed_text'])
  55. class MinifyTests(TestCase):
  56. def test_minified_text(self):
  57. """parser minifies text successfully"""
  58. test_text = """
  59. Lorem ipsum.
  60. Lorem ipsum.
  61. """.strip()
  62. expected_result = """
  63. <p>Lorem ipsum.</p><p>Lorem ipsum.</p>
  64. """.strip()
  65. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  66. self.assertEqual(expected_result, result['parsed_text'])
  67. def test_minified_unicode_text(self):
  68. """parser minifies unicode text successfully"""
  69. test_text = """
  70. Bżęczyszczykiewłicz ipsum.
  71. Lorem ipsum.
  72. """.strip()
  73. expected_result = """
  74. <p>Bżęczyszczykiewłicz ipsum.</p><p>Lorem ipsum.</p>
  75. """.strip()
  76. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  77. self.assertEqual(expected_result, result['parsed_text'])
  78. def test_complex_paragraph(self):
  79. """parser minifies complex paragraph"""
  80. user = UserModel.objects.create_user('Bob', 'bob@test.com', 'Pass123')
  81. test_text = """
  82. Hey there @{}, how's going?
  83. """.strip().format(user)
  84. expected_result = """
  85. <p>Hey there <a href="{}">@{}</a>, how's going?</p>
  86. """.strip().format(user.get_absolute_url(), user)
  87. result = parse(test_text, MockRequest(user), user, minify=True)
  88. self.assertEqual(expected_result, result['parsed_text'])
  89. class CleanLinksTests(TestCase):
  90. def test_clean_current_link(self):
  91. """clean_links step cleans http://test.com"""
  92. test_text = """
  93. Lorem ipsum: http://test.com
  94. """.strip()
  95. expected_result = """
  96. <p>Lorem ipsum: <a href="/" rel="nofollow">test.com</a></p>
  97. """.strip()
  98. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  99. self.assertEqual(expected_result, result['parsed_text'])
  100. self.assertEqual(result['internal_links'], ['/'])
  101. self.assertEqual(result['images'], [])
  102. self.assertEqual(result['outgoing_links'], [])
  103. def test_clean_schemaless_link(self):
  104. """clean_links step cleans test.com"""
  105. test_text = """
  106. Lorem ipsum: test.com
  107. """.strip()
  108. expected_result = """
  109. <p>Lorem ipsum: <a href="/" rel="nofollow">test.com</a></p>
  110. """.strip()
  111. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  112. self.assertEqual(expected_result, result['parsed_text'])
  113. self.assertEqual(result['internal_links'], ['/'])
  114. self.assertEqual(result['images'], [])
  115. self.assertEqual(result['outgoing_links'], [])
  116. def test_trim_current_path(self):
  117. """clean_links step leaves http://test.com path"""
  118. test_text = """
  119. Lorem ipsum: http://test.com/somewhere-something/
  120. """.strip()
  121. expected_result = """
  122. <p>Lorem ipsum: <a href="/somewhere-something/" rel="nofollow">test.com/somewhere-something/</a></p>
  123. """.strip()
  124. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  125. self.assertEqual(expected_result, result['parsed_text'])
  126. self.assertEqual(result['internal_links'], ['/somewhere-something/'])
  127. self.assertEqual(result['images'], [])
  128. self.assertEqual(result['outgoing_links'], [])
  129. def test_clean_outgoing_link_domain(self):
  130. """clean_links step leaves outgoing domain link"""
  131. test_text = """
  132. Lorem ipsum: http://somewhere.com
  133. """.strip()
  134. expected_result = """
  135. <p>Lorem ipsum: <a href="http://somewhere.com" rel="nofollow">somewhere.com</a></p>
  136. """.strip()
  137. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  138. self.assertEqual(expected_result, result['parsed_text'])
  139. self.assertEqual(result['outgoing_links'], ['http://somewhere.com'])
  140. self.assertEqual(result['images'], [])
  141. self.assertEqual(result['internal_links'], [])
  142. def test_trim_outgoing_path(self):
  143. """clean_links step leaves outgoing link domain and path"""
  144. test_text = """
  145. Lorem ipsum: http://somewhere.com/somewhere-something/
  146. """.strip()
  147. expected_result = """
  148. <p>Lorem ipsum: <a href="http://somewhere.com/somewhere-something/" rel="nofollow">somewhere.com/somewhere-something/</a></p>
  149. """.strip()
  150. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  151. self.assertEqual(expected_result, result['parsed_text'])
  152. self.assertEqual(result['outgoing_links'], ['http://somewhere.com/somewhere-something/'])
  153. self.assertEqual(result['images'], [])
  154. self.assertEqual(result['internal_links'], [])
  155. def test_clean_local_image_src(self):
  156. """clean_links step cleans local image src"""
  157. test_text = """
  158. !(http://test.com/image.jpg)
  159. """.strip()
  160. expected_result = """
  161. <p><img alt="test.com/image.jpg" src="/image.jpg"/></p>
  162. """.strip()
  163. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  164. self.assertEqual(expected_result, result['parsed_text'])
  165. self.assertEqual(result['images'], ['/image.jpg'])
  166. self.assertEqual(result['internal_links'], [])
  167. self.assertEqual(result['outgoing_links'], [])
  168. def test_clean_remote_image_src(self):
  169. """clean_links step cleans remote image src"""
  170. test_text = """
  171. !(http://somewhere.com/image.jpg)
  172. """.strip()
  173. expected_result = """
  174. <p><img alt="somewhere.com/image.jpg" src="http://somewhere.com/image.jpg"/></p>
  175. """.strip()
  176. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  177. self.assertEqual(expected_result, result['parsed_text'])
  178. self.assertEqual(result['images'], ['somewhere.com/image.jpg'])
  179. self.assertEqual(result['internal_links'], [])
  180. self.assertEqual(result['outgoing_links'], [])
  181. def test_clean_linked_image(self):
  182. """parser handles image element nested in link"""
  183. test_text = """
  184. [![3.png](http://test.com/a/thumb/test/43/)](http://test.com/a/test/43/)
  185. """.strip()
  186. expected_result = """
  187. <p><a href="/a/test/43/" rel="nofollow"><img alt="3.png" src="/a/thumb/test/43/"/></a></p>
  188. """.strip()
  189. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  190. self.assertEqual(expected_result, result['parsed_text'])
  191. self.assertEqual(result['images'], ['/a/thumb/test/43/'])
  192. self.assertEqual(result['internal_links'], ['/a/test/43/'])
  193. self.assertEqual(result['outgoing_links'], [])
  194. def test_force_shva(self):
  195. """parser appends ?shva=1 bit to attachment links if flag is present"""
  196. test_text = """
  197. ![3.png](http://test.com/a/thumb/test/43/)
  198. """.strip()
  199. expected_result = """
  200. <p><img alt="3.png" src="/a/thumb/test/43/?shva=1"/></p>
  201. """.strip()
  202. result = parse(test_text, MockRequest(), MockPoster(), minify=True, force_shva=True)
  203. self.assertEqual(expected_result, result['parsed_text'])
  204. self.assertEqual(result['images'], ['/a/thumb/test/43/'])
  205. self.assertEqual(result['internal_links'], [])
  206. self.assertEqual(result['outgoing_links'], [])
  207. def test_remove_shva(self):
  208. """parser removes ?shva=1 bit from attachment links if flag is absent"""
  209. test_text = """
  210. ![3.png](http://test.com/a/thumb/test/43/?shva=1)
  211. """.strip()
  212. expected_result = """
  213. <p><img alt="3.png" src="/a/thumb/test/43/"/></p>
  214. """.strip()
  215. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  216. self.assertEqual(expected_result, result['parsed_text'])
  217. self.assertEqual(result['images'], ['/a/thumb/test/43/?shva=1'])
  218. self.assertEqual(result['internal_links'], [])
  219. self.assertEqual(result['outgoing_links'], [])
  220. class LinkifyTests(TestCase):
  221. def test_clean_current_link(self):
  222. """clean_links step cleans http://test.com"""
  223. test_text = """
  224. Lorem ipsum: `<http://test.com>`
  225. """.strip()
  226. expected_result = """
  227. <p>Lorem ipsum: <code>&lt;http://test.com&gt;</code></p>
  228. """.strip()
  229. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  230. self.assertEqual(expected_result, result['parsed_text'])
  231. self.assertEqual(result['internal_links'], [])
  232. self.assertEqual(result['images'], [])
  233. self.assertEqual(result['outgoing_links'], [])
  234. class StriketroughTests(TestCase):
  235. def test_striketrough(self):
  236. """striketrough markdown deletes test"""
  237. test_text = """
  238. Lorem ~~ipsum, dolor~~ met.
  239. """.strip()
  240. expected_result = """
  241. <p>Lorem <del>ipsum, dolor</del> met.</p>
  242. """.strip()
  243. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  244. self.assertEqual(expected_result, result['parsed_text'])
  245. class QuoteTests(TestCase):
  246. def test_quotes(self):
  247. """bbcode for quote is supported"""
  248. test_text = """
  249. Lorem ipsum.
  250. [quote]Dolor met[/quote]
  251. [quote]Dolor <b>met</b>[/quote]
  252. [quote]Dolor **met**[quote]Dolor met[/quote][/quote]
  253. """.strip()
  254. expected_result = """
  255. <p>Lorem ipsum.</p>
  256. <aside class="quote-block">
  257. <div class="quote-heading"></div>
  258. <blockquote class="quote-body">
  259. <p>Dolor met</p>
  260. </blockquote>
  261. </aside>
  262. <aside class="quote-block">
  263. <div class="quote-heading"></div>
  264. <blockquote class="quote-body">
  265. <p>Dolor &lt;b&gt;met&lt;/b&gt;</p>
  266. </blockquote>
  267. </aside>
  268. <aside class="quote-block">
  269. <div class="quote-heading"></div>
  270. <blockquote class="quote-body">
  271. <p>Dolor <strong>met</strong></p>
  272. <aside class="quote-block">
  273. <div class="quote-heading"></div>
  274. <blockquote class="quote-body">
  275. <p>Dolor met</p>
  276. </blockquote>
  277. </aside>
  278. </blockquote>
  279. </aside>
  280. """.strip()
  281. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  282. self.assertEqual(expected_result, result['parsed_text'])
  283. def test_authored_quotes(self):
  284. """bbcode for authored quote is supported and handles mentions as well"""
  285. test_text = """
  286. Lorem ipsum.
  287. [quote]Dolor met[/quote]
  288. [quote=\"@Bob\"]Dolor <b>met</b>[/quote]
  289. [quote]Dolor **met**[quote=@Bob]Dolor met[/quote][/quote]
  290. """.strip()
  291. expected_result = """
  292. <p>Lorem ipsum.</p>
  293. <aside class="quote-block">
  294. <div class="quote-heading"></div>
  295. <blockquote class="quote-body">
  296. <p>Dolor met</p>
  297. </blockquote>
  298. </aside>
  299. <aside class="quote-block">
  300. <div class="quote-heading">@Bob</div>
  301. <blockquote class="quote-body">
  302. <p>Dolor &lt;b&gt;met&lt;/b&gt;</p>
  303. </blockquote>
  304. </aside>
  305. <aside class="quote-block">
  306. <div class="quote-heading"></div>
  307. <blockquote class="quote-body">
  308. <p>Dolor <strong>met</strong></p>
  309. <aside class="quote-block">
  310. <div class="quote-heading">@Bob</div>
  311. <blockquote class="quote-body">
  312. <p>Dolor met</p>
  313. </blockquote>
  314. </aside>
  315. </blockquote>
  316. </aside>
  317. """.strip()
  318. request = MockRequest(user=MockPoster())
  319. result = parse(test_text, request, MockPoster(), minify=False)
  320. self.assertEqual(expected_result, result['parsed_text'])
  321. def test_custom_quote_title(self):
  322. """parser handles custom quotetitle"""
  323. test_text = """
  324. Lorem ipsum.
  325. [quote=\"Lorem ipsum very test\"]Dolor <b>met</b>[/quote]
  326. """.strip()
  327. expected_result = """
  328. <p>Lorem ipsum.</p>
  329. <aside class="quote-block">
  330. <div class="quote-heading">Lorem ipsum very test</div>
  331. <blockquote class="quote-body">
  332. <p>Dolor &lt;b&gt;met&lt;/b&gt;</p>
  333. </blockquote>
  334. </aside>
  335. """.strip()
  336. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  337. self.assertEqual(expected_result, result['parsed_text'])
  338. def test_hr_edge_case(self):
  339. """test for weird edge case in which hr gets moved outside of quote"""
  340. test_text = """
  341. Lorem ipsum.
  342. [quote]
  343. Dolor met
  344. - - - - -
  345. Amet elit
  346. [/quote]
  347. """.strip()
  348. expected_result = """
  349. <p>Lorem ipsum.</p>
  350. <aside class="quote-block">
  351. <div class="quote-heading"></div>
  352. <blockquote class="quote-body">
  353. <p>Dolor met</p>
  354. <hr/>
  355. <p>Amet elit</p>
  356. </blockquote>
  357. </aside>
  358. """.strip()
  359. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  360. self.assertEqual(expected_result, result['parsed_text'])
  361. class CodeTests(TestCase):
  362. def test_code(self):
  363. """code bbcode is correctly parsed"""
  364. test_text = """
  365. Lorem ipsum.
  366. [code]
  367. Dolor [b]met.[/b]
  368. [/code]
  369. """.strip()
  370. expected_result = """
  371. <p>Lorem ipsum.</p>
  372. <pre><code>Dolor [b]met.[/b]</code></pre>
  373. """.strip()
  374. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  375. self.assertEqual(expected_result, result['parsed_text'])
  376. def test_inline_code(self):
  377. """inline code bbcode is correctly parsed"""
  378. test_text = """
  379. Lorem ipsum.
  380. [code]Dolor [b]met.[/b][/code]
  381. """.strip()
  382. expected_result = """
  383. <p>Lorem ipsum.</p>
  384. <pre><code>Dolor [b]met.[/b]</code></pre>
  385. """.strip()
  386. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  387. self.assertEqual(expected_result, result['parsed_text'])
  388. def test_code_strip(self):
  389. """code bbcode trims its content"""
  390. test_text = """
  391. Lorem ipsum.
  392. [code]
  393. Dolor [b]met.[/b]
  394. [/code]
  395. """.strip()
  396. expected_result = """
  397. <p>Lorem ipsum.</p>
  398. <pre><code> Dolor [b]met.[/b]</code></pre>
  399. """.strip()
  400. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  401. self.assertEqual(expected_result, result['parsed_text'])
  402. def test_code_language(self):
  403. """code bbcode with language is correctly parsed"""
  404. test_text = """
  405. Lorem ipsum.
  406. [code="python"]
  407. Dolor [b]met.[/b]
  408. [/code]
  409. """.strip()
  410. expected_result = """
  411. <p>Lorem ipsum.</p>
  412. <pre><code class="python">Dolor [b]met.[/b]</code></pre>
  413. """.strip()
  414. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  415. self.assertEqual(expected_result, result['parsed_text'])
  416. def test_code_language_optional_quotes(self):
  417. """code quotes around language name are optional"""
  418. test_text = """
  419. Lorem ipsum.
  420. [code=python"]
  421. Dolor [b]met.[/b]
  422. [/code]
  423. """.strip()
  424. expected_result = """
  425. <p>Lorem ipsum.</p>
  426. <pre><code class="python">Dolor [b]met.[/b]</code></pre>
  427. """.strip()
  428. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  429. self.assertEqual(expected_result, result['parsed_text'])
  430. test_text = """
  431. Lorem ipsum.
  432. [code="python]
  433. Dolor [b]met.[/b]
  434. [/code]
  435. """.strip()
  436. expected_result = """
  437. <p>Lorem ipsum.</p>
  438. <pre><code class="python">Dolor [b]met.[/b]</code></pre>
  439. """.strip()
  440. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  441. self.assertEqual(expected_result, result['parsed_text'])