test_parser.py 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614
  1. from __future__ import unicode_literals
  2. from django.contrib.auth import get_user_model
  3. from django.test import TestCase
  4. from misago.markup.parser import parse
  5. UserModel = get_user_model()
  6. class MockRequest(object):
  7. scheme = 'http'
  8. def __init__(self, user=None):
  9. self.user = user
  10. def get_host(self):
  11. return 'test.com'
  12. class MockPoster(object):
  13. username = 'LoremIpsum'
  14. slug = 'loremipsum'
  15. class HTMLTests(TestCase):
  16. def test_html_escaped(self):
  17. """parser escapes all html"""
  18. test_text = """
  19. Lorem <strong>ipsum!</strong>
  20. """.strip()
  21. expected_result = """
  22. <p>Lorem &lt;strong&gt;ipsum!&lt;/strong&gt;</p>
  23. """.strip()
  24. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  25. self.assertEqual(expected_result, result['parsed_text'])
  26. self.assertEqual(result['internal_links'], [])
  27. self.assertEqual(result['images'], [])
  28. self.assertEqual(result['outgoing_links'], [])
  29. class BBCodeTests(TestCase):
  30. def test_inline_text(self):
  31. """inline elements are correctly parsed"""
  32. test_text = """
  33. Lorem **ipsum**, dolor met.
  34. Lorem [b]ipsum[/b], [i]dolor[/i] [u]met[/u].
  35. Lorem [b]**ipsum**[/b] [i]dolor[/i] [u]met[/u].
  36. Lorem [b]**ipsum[/b]** [i]dolor[/i] [u]met[/u].
  37. Lorem [b]__ipsum[/b]__ [i]dolor[/i] [u]met[/u].
  38. Lorem [b][i]ipsum[/i][/b].
  39. Lorem [b][i]ipsum[/b][/i].
  40. Lorem [b]ipsum[/B].
  41. """.strip()
  42. expected_result = """
  43. <p>Lorem <strong>ipsum</strong>, dolor met.</p>
  44. <p>Lorem <b>ipsum</b>, <i>dolor</i> <u>met</u>.</p>
  45. <p>Lorem <b><strong>ipsum</strong></b> <i>dolor</i> <u>met</u>.</p>
  46. <p>Lorem <b>**ipsum</b>** <i>dolor</i> <u>met</u>.</p>
  47. <p>Lorem <b>__ipsum</b>__ <i>dolor</i> <u>met</u>.</p>
  48. <p>Lorem <b><i>ipsum</i></b>.</p>
  49. <p>Lorem <b>[i]ipsum</b>[/i].</p>
  50. <p>Lorem <b>ipsum</b>.</p>
  51. """.strip()
  52. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  53. self.assertEqual(expected_result, result['parsed_text'])
  54. def test_hr(self):
  55. """hr bbcode is correctly parsed"""
  56. test_text = """
  57. Lorem ipsum.
  58. [hr]
  59. Dolor met.
  60. """.strip()
  61. expected_result = """
  62. <p>Lorem ipsum.</p>
  63. <hr/>
  64. <p>Dolor met.</p>
  65. """.strip()
  66. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  67. self.assertEqual(expected_result, result['parsed_text'])
  68. def test_img(self):
  69. """img bbcode is correctly parsed"""
  70. test_text = """
  71. Lorem ipsum [img]https://placekitten.com/g/1200/500[/img]
  72. Lorem ipsum [iMg]https://placekitten.com/g/1200/500[/ImG]
  73. Lorem ipsum !(https://placekitten.com/g/1200/500)
  74. """.strip()
  75. expected_result = """
  76. <p>Lorem ipsum <img alt="placekitten.com/g/1200/500" src="https://placekitten.com/g/1200/500"/></p>
  77. <p>Lorem ipsum <img alt="placekitten.com/g/1200/500" src="https://placekitten.com/g/1200/500"/></p>
  78. <p>Lorem ipsum <img alt="placekitten.com/g/1200/500" src="https://placekitten.com/g/1200/500"/></p>
  79. """.strip()
  80. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  81. self.assertEqual(expected_result, result['parsed_text'])
  82. def test_url(self):
  83. """url bbcode is correctly parsed"""
  84. test_text = """
  85. Lorem ipsum [url]placekitten.com/g/300/300[/url]
  86. Lorem ipsum [url]https://placekitten.com/g/600/600[/url]
  87. Lorem ipsum [uRL=https://placekitten.com/g/400/400"]Label text![/UrL]
  88. Lorem ipsum [Lorem ipsum](https://placekitten.com/g/1200/500)
  89. """.strip()
  90. expected_result = """
  91. <p>Lorem ipsum <a href="http://placekitten.com/g/300/300" rel="nofollow noopener">placekitten.com/g/300/300</a></p>
  92. <p>Lorem ipsum <a href="https://placekitten.com/g/600/600" rel="nofollow noopener">placekitten.com/g/600/600</a></p>
  93. <p>Lorem ipsum <a href="https://placekitten.com/g/400/400" rel="nofollow noopener">Label text!</a></p>
  94. <p>Lorem ipsum <a href="https://placekitten.com/g/1200/500" rel="nofollow noopener">Lorem ipsum</a></p>
  95. """.strip()
  96. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  97. self.assertEqual(expected_result, result['parsed_text'])
  98. class MinifyTests(TestCase):
  99. def test_minified_text(self):
  100. """parser minifies text successfully"""
  101. test_text = """
  102. Lorem ipsum.
  103. Lorem ipsum.
  104. """.strip()
  105. expected_result = """
  106. <p>Lorem ipsum.</p><p>Lorem ipsum.</p>
  107. """.strip()
  108. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  109. self.assertEqual(expected_result, result['parsed_text'])
  110. def test_minified_unicode_text(self):
  111. """parser minifies unicode text successfully"""
  112. test_text = """
  113. Bżęczyszczykiewłicz ipsum.
  114. Lorem ipsum.
  115. """.strip()
  116. expected_result = """
  117. <p>Bżęczyszczykiewłicz ipsum.</p><p>Lorem ipsum.</p>
  118. """.strip()
  119. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  120. self.assertEqual(expected_result, result['parsed_text'])
  121. def test_complex_paragraph(self):
  122. """parser minifies complex paragraph"""
  123. user = UserModel.objects.create_user('Bob', 'bob@test.com', 'Pass123')
  124. test_text = """
  125. Hey there @{}, how's going?
  126. """.strip().format(user)
  127. expected_result = """
  128. <p>Hey there <a href="{}">@{}</a>, how's going?</p>
  129. """.strip().format(user.get_absolute_url(), user)
  130. result = parse(test_text, MockRequest(user), user, minify=True)
  131. self.assertEqual(expected_result, result['parsed_text'])
  132. class CleanLinksTests(TestCase):
  133. def test_clean_current_link(self):
  134. """clean_links step cleans http://test.com"""
  135. test_text = """
  136. Lorem ipsum: http://test.com
  137. """.strip()
  138. expected_result = """
  139. <p>Lorem ipsum: <a href="/">test.com</a></p>
  140. """.strip()
  141. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  142. self.assertEqual(expected_result, result['parsed_text'])
  143. self.assertEqual(result['internal_links'], ['/'])
  144. self.assertEqual(result['images'], [])
  145. self.assertEqual(result['outgoing_links'], [])
  146. def test_clean_schemaless_link(self):
  147. """clean_links step cleans test.com"""
  148. test_text = """
  149. Lorem ipsum: test.com
  150. """.strip()
  151. expected_result = """
  152. <p>Lorem ipsum: <a href="/">test.com</a></p>
  153. """.strip()
  154. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  155. self.assertEqual(expected_result, result['parsed_text'])
  156. self.assertEqual(result['internal_links'], ['/'])
  157. self.assertEqual(result['images'], [])
  158. self.assertEqual(result['outgoing_links'], [])
  159. def test_trim_current_path(self):
  160. """clean_links step leaves http://test.com path"""
  161. test_text = """
  162. Lorem ipsum: http://test.com/somewhere-something/
  163. """.strip()
  164. expected_result = """
  165. <p>Lorem ipsum: <a href="/somewhere-something/">test.com/somewhere-something/</a></p>
  166. """.strip()
  167. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  168. self.assertEqual(expected_result, result['parsed_text'])
  169. self.assertEqual(result['internal_links'], ['/somewhere-something/'])
  170. self.assertEqual(result['images'], [])
  171. self.assertEqual(result['outgoing_links'], [])
  172. def test_clean_outgoing_link_domain(self):
  173. """clean_links step leaves outgoing domain link"""
  174. test_text = """
  175. Lorem ipsum: http://somewhere.com
  176. """.strip()
  177. expected_result = """
  178. <p>Lorem ipsum: <a href="http://somewhere.com" rel="nofollow noopener">somewhere.com</a></p>
  179. """.strip()
  180. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  181. self.assertEqual(expected_result, result['parsed_text'])
  182. self.assertEqual(result['outgoing_links'], ['somewhere.com'])
  183. self.assertEqual(result['images'], [])
  184. self.assertEqual(result['internal_links'], [])
  185. def test_trim_outgoing_path(self):
  186. """clean_links step leaves outgoing link domain and path"""
  187. test_text = """
  188. Lorem ipsum: http://somewhere.com/somewhere-something/
  189. """.strip()
  190. expected_result = """
  191. <p>Lorem ipsum: <a href="http://somewhere.com/somewhere-something/" rel="nofollow noopener">somewhere.com/somewhere-something/</a></p>
  192. """.strip()
  193. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  194. self.assertEqual(expected_result, result['parsed_text'])
  195. self.assertEqual(result['outgoing_links'], ['somewhere.com/somewhere-something/'])
  196. self.assertEqual(result['images'], [])
  197. self.assertEqual(result['internal_links'], [])
  198. def test_clean_local_image_src(self):
  199. """clean_links step cleans local image src"""
  200. test_text = """
  201. !(http://test.com/image.jpg)
  202. """.strip()
  203. expected_result = """
  204. <p><img alt="test.com/image.jpg" src="/image.jpg"/></p>
  205. """.strip()
  206. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  207. self.assertEqual(expected_result, result['parsed_text'])
  208. self.assertEqual(result['images'], ['/image.jpg'])
  209. self.assertEqual(result['internal_links'], [])
  210. self.assertEqual(result['outgoing_links'], [])
  211. def test_clean_remote_image_src(self):
  212. """clean_links step cleans remote image src"""
  213. test_text = """
  214. !(http://somewhere.com/image.jpg)
  215. """.strip()
  216. expected_result = """
  217. <p><img alt="somewhere.com/image.jpg" src="http://somewhere.com/image.jpg"/></p>
  218. """.strip()
  219. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  220. self.assertEqual(expected_result, result['parsed_text'])
  221. self.assertEqual(result['images'], ['somewhere.com/image.jpg'])
  222. self.assertEqual(result['internal_links'], [])
  223. self.assertEqual(result['outgoing_links'], [])
  224. def test_clean_linked_image(self):
  225. """parser handles image element nested in link"""
  226. test_text = """
  227. [![3.png](http://test.com/a/thumb/test/43/)](http://test.com/a/test/43/)
  228. """.strip()
  229. expected_result = """
  230. <p><a href="/a/test/43/"><img alt="3.png" src="/a/thumb/test/43/"/></a></p>
  231. """.strip()
  232. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  233. self.assertEqual(expected_result, result['parsed_text'])
  234. self.assertEqual(result['images'], ['/a/thumb/test/43/'])
  235. self.assertEqual(result['internal_links'], ['/a/test/43/'])
  236. self.assertEqual(result['outgoing_links'], [])
  237. def test_force_shva(self):
  238. """parser appends ?shva=1 bit to attachment links if flag is present"""
  239. test_text = """
  240. ![3.png](http://test.com/a/thumb/test/43/)
  241. """.strip()
  242. expected_result = """
  243. <p><img alt="3.png" src="/a/thumb/test/43/?shva=1"/></p>
  244. """.strip()
  245. result = parse(test_text, MockRequest(), MockPoster(), minify=True, force_shva=True)
  246. self.assertEqual(expected_result, result['parsed_text'])
  247. self.assertEqual(result['images'], ['/a/thumb/test/43/'])
  248. self.assertEqual(result['internal_links'], [])
  249. self.assertEqual(result['outgoing_links'], [])
  250. def test_remove_shva(self):
  251. """parser removes ?shva=1 bit from attachment links if flag is absent"""
  252. test_text = """
  253. ![3.png](http://test.com/a/thumb/test/43/?shva=1)
  254. """.strip()
  255. expected_result = """
  256. <p><img alt="3.png" src="/a/thumb/test/43/"/></p>
  257. """.strip()
  258. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  259. self.assertEqual(expected_result, result['parsed_text'])
  260. self.assertEqual(result['images'], ['/a/thumb/test/43/?shva=1'])
  261. self.assertEqual(result['internal_links'], [])
  262. self.assertEqual(result['outgoing_links'], [])
  263. class LinkifyTests(TestCase):
  264. def test_clean_current_link(self):
  265. """clean_links step cleans http://test.com"""
  266. test_text = """
  267. Lorem ipsum: `<http://test.com>`
  268. """.strip()
  269. expected_result = """
  270. <p>Lorem ipsum: <code>&lt;http://test.com&gt;</code></p>
  271. """.strip()
  272. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  273. self.assertEqual(expected_result, result['parsed_text'])
  274. self.assertEqual(result['internal_links'], [])
  275. self.assertEqual(result['images'], [])
  276. self.assertEqual(result['outgoing_links'], [])
  277. class StriketroughTests(TestCase):
  278. def test_striketrough(self):
  279. """striketrough markdown deletes test"""
  280. test_text = """
  281. Lorem ~~ipsum, dolor~~ met.
  282. """.strip()
  283. expected_result = """
  284. <p>Lorem <del>ipsum, dolor</del> met.</p>
  285. """.strip()
  286. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  287. self.assertEqual(expected_result, result['parsed_text'])
  288. class QuoteTests(TestCase):
  289. def test_quotes(self):
  290. """bbcode for quote is supported"""
  291. test_text = """
  292. Lorem ipsum.
  293. [quote]Dolor met[/quote]
  294. [quote]Dolor <b>met</b>[/quote]
  295. [quote]Dolor **met**[quote]Dolor met[/quote][/quote]
  296. """.strip()
  297. expected_result = """
  298. <p>Lorem ipsum.</p>
  299. <aside class="quote-block">
  300. <div class="quote-heading"></div>
  301. <blockquote class="quote-body">
  302. <p>Dolor met</p>
  303. </blockquote>
  304. </aside>
  305. <aside class="quote-block">
  306. <div class="quote-heading"></div>
  307. <blockquote class="quote-body">
  308. <p>Dolor &lt;b&gt;met&lt;/b&gt;</p>
  309. </blockquote>
  310. </aside>
  311. <aside class="quote-block">
  312. <div class="quote-heading"></div>
  313. <blockquote class="quote-body">
  314. <p>Dolor <strong>met</strong></p>
  315. <aside class="quote-block">
  316. <div class="quote-heading"></div>
  317. <blockquote class="quote-body">
  318. <p>Dolor met</p>
  319. </blockquote>
  320. </aside>
  321. </blockquote>
  322. </aside>
  323. """.strip()
  324. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  325. self.assertEqual(expected_result, result['parsed_text'])
  326. def test_authored_quotes(self):
  327. """bbcode for authored quote is supported and handles mentions as well"""
  328. test_text = """
  329. Lorem ipsum.
  330. [quote]Dolor met[/quote]
  331. [quote=\"@Bob\"]Dolor <b>met</b>[/quote]
  332. [quote]Dolor **met**[quote=@Bob]Dolor met[/quote][/quote]
  333. """.strip()
  334. expected_result = """
  335. <p>Lorem ipsum.</p>
  336. <aside class="quote-block">
  337. <div class="quote-heading"></div>
  338. <blockquote class="quote-body">
  339. <p>Dolor met</p>
  340. </blockquote>
  341. </aside>
  342. <aside class="quote-block">
  343. <div class="quote-heading">@Bob</div>
  344. <blockquote class="quote-body">
  345. <p>Dolor &lt;b&gt;met&lt;/b&gt;</p>
  346. </blockquote>
  347. </aside>
  348. <aside class="quote-block">
  349. <div class="quote-heading"></div>
  350. <blockquote class="quote-body">
  351. <p>Dolor <strong>met</strong></p>
  352. <aside class="quote-block">
  353. <div class="quote-heading">@Bob</div>
  354. <blockquote class="quote-body">
  355. <p>Dolor met</p>
  356. </blockquote>
  357. </aside>
  358. </blockquote>
  359. </aside>
  360. """.strip()
  361. request = MockRequest(user=MockPoster())
  362. result = parse(test_text, request, MockPoster(), minify=False)
  363. self.assertEqual(expected_result, result['parsed_text'])
  364. def test_custom_quote_title(self):
  365. """parser handles custom quotetitle"""
  366. test_text = """
  367. Lorem ipsum.
  368. [quote=\"Lorem ipsum very test\"]Dolor <b>met</b>[/quote]
  369. """.strip()
  370. expected_result = """
  371. <p>Lorem ipsum.</p>
  372. <aside class="quote-block">
  373. <div class="quote-heading">Lorem ipsum very test</div>
  374. <blockquote class="quote-body">
  375. <p>Dolor &lt;b&gt;met&lt;/b&gt;</p>
  376. </blockquote>
  377. </aside>
  378. """.strip()
  379. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  380. self.assertEqual(expected_result, result['parsed_text'])
  381. def test_hr_edge_case(self):
  382. """test for weird edge case in which hr gets moved outside of quote"""
  383. test_text = """
  384. Lorem ipsum.
  385. [quote]
  386. Dolor met
  387. - - - - -
  388. Amet elit
  389. [/quote]
  390. """.strip()
  391. expected_result = """
  392. <p>Lorem ipsum.</p>
  393. <aside class="quote-block">
  394. <div class="quote-heading"></div>
  395. <blockquote class="quote-body">
  396. <p>Dolor met</p>
  397. <hr/>
  398. <p>Amet elit</p>
  399. </blockquote>
  400. </aside>
  401. """.strip()
  402. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  403. self.assertEqual(expected_result, result['parsed_text'])
  404. class CodeTests(TestCase):
  405. def test_code(self):
  406. """code bbcode is correctly parsed"""
  407. test_text = """
  408. Lorem ipsum.
  409. [code]
  410. Dolor [b]met.[/b]
  411. [/code]
  412. """.strip()
  413. expected_result = """
  414. <p>Lorem ipsum.</p>
  415. <pre><code>Dolor [b]met.[/b]</code></pre>
  416. """.strip()
  417. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  418. self.assertEqual(expected_result, result['parsed_text'])
  419. def test_inline_code(self):
  420. """inline code bbcode is correctly parsed"""
  421. test_text = """
  422. Lorem ipsum.
  423. [code]Dolor [b]met.[/b][/code]
  424. """.strip()
  425. expected_result = """
  426. <p>Lorem ipsum.</p>
  427. <pre><code>Dolor [b]met.[/b]</code></pre>
  428. """.strip()
  429. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  430. self.assertEqual(expected_result, result['parsed_text'])
  431. def test_code_strip(self):
  432. """code bbcode trims its content"""
  433. test_text = """
  434. Lorem ipsum.
  435. [code]
  436. Dolor [b]met.[/b]
  437. [/code]
  438. """.strip()
  439. expected_result = """
  440. <p>Lorem ipsum.</p>
  441. <pre><code> Dolor [b]met.[/b]</code></pre>
  442. """.strip()
  443. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  444. self.assertEqual(expected_result, result['parsed_text'])
  445. def test_code_language(self):
  446. """code bbcode with language is correctly parsed"""
  447. test_text = """
  448. Lorem ipsum.
  449. [code="python"]
  450. Dolor [b]met.[/b]
  451. [/code]
  452. """.strip()
  453. expected_result = """
  454. <p>Lorem ipsum.</p>
  455. <pre><code class="python">Dolor [b]met.[/b]</code></pre>
  456. """.strip()
  457. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  458. self.assertEqual(expected_result, result['parsed_text'])
  459. def test_code_language_optional_quotes(self):
  460. """code quotes around language name are optional"""
  461. test_text = """
  462. Lorem ipsum.
  463. [code=python"]
  464. Dolor [b]met.[/b]
  465. [/code]
  466. """.strip()
  467. expected_result = """
  468. <p>Lorem ipsum.</p>
  469. <pre><code class="python">Dolor [b]met.[/b]</code></pre>
  470. """.strip()
  471. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  472. self.assertEqual(expected_result, result['parsed_text'])
  473. test_text = """
  474. Lorem ipsum.
  475. [code="python]
  476. Dolor [b]met.[/b]
  477. [/code]
  478. """.strip()
  479. expected_result = """
  480. <p>Lorem ipsum.</p>
  481. <pre><code class="python">Dolor [b]met.[/b]</code></pre>
  482. """.strip()
  483. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  484. self.assertEqual(expected_result, result['parsed_text'])