test_parser.py 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622
  1. from django.contrib.auth import get_user_model
  2. from django.test import TestCase
  3. from misago.markup.parser import parse
# User model resolved through Django's get_user_model(); the tests below use it
# to create a real user via User.objects.create_user().
User = get_user_model()
  5. class MockRequest(object):
  6. scheme = "http"
  7. def __init__(self, user=None):
  8. self.user = user
  9. def get_host(self):
  10. return "test.com"
  11. class MockPoster(object):
  12. username = "LoremIpsum"
  13. slug = "loremipsum"
  14. class HTMLTests(TestCase):
  15. def test_html_escaped(self):
  16. """parser escapes all html"""
  17. test_text = """
  18. Lorem <strong>ipsum!</strong>
  19. """.strip()
  20. expected_result = """
  21. <p>Lorem &lt;strong&gt;ipsum!&lt;/strong&gt;</p>
  22. """.strip()
  23. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  24. self.assertEqual(expected_result, result["parsed_text"])
  25. self.assertEqual(result["internal_links"], [])
  26. self.assertEqual(result["images"], [])
  27. self.assertEqual(result["outgoing_links"], [])
  28. class BBCodeTests(TestCase):
  29. def test_inline_text(self):
  30. """inline elements are correctly parsed"""
  31. test_text = """
  32. Lorem **ipsum**, dolor met.
  33. Lorem [b]ipsum[/b], [i]dolor[/i] [u]met[/u].
  34. Lorem [b]**ipsum**[/b] [i]dolor[/i] [u]met[/u].
  35. Lorem [b]**ipsum[/b]** [i]dolor[/i] [u]met[/u].
  36. Lorem [b]__ipsum[/b]__ [i]dolor[/i] [u]met[/u].
  37. Lorem [b][i]ipsum[/i][/b].
  38. Lorem [b][i]ipsum[/b][/i].
  39. Lorem [b]ipsum[/B].
  40. """.strip()
  41. expected_result = """
  42. <p>Lorem <strong>ipsum</strong>, dolor met.</p>
  43. <p>Lorem <b>ipsum</b>, <i>dolor</i> <u>met</u>.</p>
  44. <p>Lorem <b><strong>ipsum</strong></b> <i>dolor</i> <u>met</u>.</p>
  45. <p>Lorem <b>**ipsum</b>** <i>dolor</i> <u>met</u>.</p>
  46. <p>Lorem <b>__ipsum</b>__ <i>dolor</i> <u>met</u>.</p>
  47. <p>Lorem <b><i>ipsum</i></b>.</p>
  48. <p>Lorem <b>[i]ipsum</b>[/i].</p>
  49. <p>Lorem <b>ipsum</b>.</p>
  50. """.strip()
  51. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  52. self.assertEqual(expected_result, result["parsed_text"])
  53. def test_hr(self):
  54. """hr bbcode is correctly parsed"""
  55. test_text = """
  56. Lorem ipsum.
  57. [hr]
  58. Dolor met.
  59. """.strip()
  60. expected_result = """
  61. <p>Lorem ipsum.</p>
  62. <hr/>
  63. <p>Dolor met.</p>
  64. """.strip()
  65. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  66. self.assertEqual(expected_result, result["parsed_text"])
  67. def test_img(self):
  68. """img bbcode is correctly parsed"""
  69. test_text = """
  70. Lorem ipsum [img]https://placekitten.com/g/1200/500[/img]
  71. Lorem ipsum [iMg]https://placekitten.com/g/1200/500[/ImG]
  72. Lorem ipsum !(https://placekitten.com/g/1200/500)
  73. """.strip()
  74. expected_result = """
  75. <p>Lorem ipsum <img alt="placekitten.com/g/1200/500" src="https://placekitten.com/g/1200/500"/></p>
  76. <p>Lorem ipsum <img alt="placekitten.com/g/1200/500" src="https://placekitten.com/g/1200/500"/></p>
  77. <p>Lorem ipsum <img alt="placekitten.com/g/1200/500" src="https://placekitten.com/g/1200/500"/></p>
  78. """.strip()
  79. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  80. self.assertEqual(expected_result, result["parsed_text"])
  81. def test_url(self):
  82. """url bbcode is correctly parsed"""
  83. test_text = """
  84. Lorem ipsum [url]placekitten.com/g/300/300[/url]
  85. Lorem ipsum [url]https://placekitten.com/g/600/600[/url]
  86. Lorem ipsum [uRL=https://placekitten.com/g/400/400"]Label text![/UrL]
  87. Lorem ipsum [Lorem ipsum](https://placekitten.com/g/1200/500)
  88. """.strip()
  89. expected_result = """
  90. <p>Lorem ipsum <a href="http://placekitten.com/g/300/300" rel="nofollow noopener">placekitten.com/g/300/300</a></p>
  91. <p>Lorem ipsum <a href="https://placekitten.com/g/600/600" rel="nofollow noopener">placekitten.com/g/600/600</a></p>
  92. <p>Lorem ipsum <a href="https://placekitten.com/g/400/400" rel="nofollow noopener">Label text!</a></p>
  93. <p>Lorem ipsum <a href="https://placekitten.com/g/1200/500" rel="nofollow noopener">Lorem ipsum</a></p>
  94. """.strip()
  95. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  96. self.assertEqual(expected_result, result["parsed_text"])
  97. class MinifyTests(TestCase):
  98. def test_minified_text(self):
  99. """parser minifies text successfully"""
  100. test_text = """
  101. Lorem ipsum.
  102. Lorem ipsum.
  103. """.strip()
  104. expected_result = """
  105. <p>Lorem ipsum.</p><p>Lorem ipsum.</p>
  106. """.strip()
  107. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  108. self.assertEqual(expected_result, result["parsed_text"])
  109. def test_minified_unicode_text(self):
  110. """parser minifies unicode text successfully"""
  111. test_text = """
  112. Bżęczyszczykiewłicz ipsum.
  113. Lorem ipsum.
  114. """.strip()
  115. expected_result = """
  116. <p>Bżęczyszczykiewłicz ipsum.</p><p>Lorem ipsum.</p>
  117. """.strip()
  118. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  119. self.assertEqual(expected_result, result["parsed_text"])
  120. def test_complex_paragraph(self):
  121. """parser minifies complex paragraph"""
  122. user = User.objects.create_user("Bob", "bob@test.com", "Pass123")
  123. test_text = (
  124. """
  125. Hey there @%s, how's going?
  126. """.strip()
  127. % user
  128. )
  129. expected_result = """
  130. <p>Hey there <a href="%s">@%s</a>, how's going?</p>
  131. """.strip() % (
  132. user.get_absolute_url(),
  133. user,
  134. )
  135. result = parse(test_text, MockRequest(user), user, minify=True)
  136. self.assertEqual(expected_result, result["parsed_text"])
  137. class CleanLinksTests(TestCase):
  138. def test_clean_current_link(self):
  139. """clean_links step cleans http://test.com"""
  140. test_text = """
  141. Lorem ipsum: http://test.com
  142. """.strip()
  143. expected_result = """
  144. <p>Lorem ipsum: <a href="/">test.com</a></p>
  145. """.strip()
  146. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  147. self.assertEqual(expected_result, result["parsed_text"])
  148. self.assertEqual(result["internal_links"], ["/"])
  149. self.assertEqual(result["images"], [])
  150. self.assertEqual(result["outgoing_links"], [])
  151. def test_clean_schemaless_link(self):
  152. """clean_links step cleans test.com"""
  153. test_text = """
  154. Lorem ipsum: test.com
  155. """.strip()
  156. expected_result = """
  157. <p>Lorem ipsum: <a href="/">test.com</a></p>
  158. """.strip()
  159. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  160. self.assertEqual(expected_result, result["parsed_text"])
  161. self.assertEqual(result["internal_links"], ["/"])
  162. self.assertEqual(result["images"], [])
  163. self.assertEqual(result["outgoing_links"], [])
  164. def test_trim_current_path(self):
  165. """clean_links step leaves http://test.com path"""
  166. test_text = """
  167. Lorem ipsum: http://test.com/somewhere-something/
  168. """.strip()
  169. expected_result = """
  170. <p>Lorem ipsum: <a href="/somewhere-something/">test.com/somewhere-something/</a></p>
  171. """.strip()
  172. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  173. self.assertEqual(expected_result, result["parsed_text"])
  174. self.assertEqual(result["internal_links"], ["/somewhere-something/"])
  175. self.assertEqual(result["images"], [])
  176. self.assertEqual(result["outgoing_links"], [])
  177. def test_clean_outgoing_link_domain(self):
  178. """clean_links step leaves outgoing domain link"""
  179. test_text = """
  180. Lorem ipsum: http://somewhere.com
  181. """.strip()
  182. expected_result = """
  183. <p>Lorem ipsum: <a href="http://somewhere.com" rel="nofollow noopener">somewhere.com</a></p>
  184. """.strip()
  185. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  186. self.assertEqual(expected_result, result["parsed_text"])
  187. self.assertEqual(result["outgoing_links"], ["somewhere.com"])
  188. self.assertEqual(result["images"], [])
  189. self.assertEqual(result["internal_links"], [])
  190. def test_trim_outgoing_path(self):
  191. """clean_links step leaves outgoing link domain and path"""
  192. test_text = """
  193. Lorem ipsum: http://somewhere.com/somewhere-something/
  194. """.strip()
  195. expected_result = """
  196. <p>Lorem ipsum: <a href="http://somewhere.com/somewhere-something/" rel="nofollow noopener">somewhere.com/somewhere-something/</a></p>
  197. """.strip()
  198. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  199. self.assertEqual(expected_result, result["parsed_text"])
  200. self.assertEqual(
  201. result["outgoing_links"], ["somewhere.com/somewhere-something/"]
  202. )
  203. self.assertEqual(result["images"], [])
  204. self.assertEqual(result["internal_links"], [])
  205. def test_clean_local_image_src(self):
  206. """clean_links step cleans local image src"""
  207. test_text = """
  208. !(http://test.com/image.jpg)
  209. """.strip()
  210. expected_result = """
  211. <p><img alt="test.com/image.jpg" src="/image.jpg"/></p>
  212. """.strip()
  213. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  214. self.assertEqual(expected_result, result["parsed_text"])
  215. self.assertEqual(result["images"], ["/image.jpg"])
  216. self.assertEqual(result["internal_links"], [])
  217. self.assertEqual(result["outgoing_links"], [])
  218. def test_clean_remote_image_src(self):
  219. """clean_links step cleans remote image src"""
  220. test_text = """
  221. !(http://somewhere.com/image.jpg)
  222. """.strip()
  223. expected_result = """
  224. <p><img alt="somewhere.com/image.jpg" src="http://somewhere.com/image.jpg"/></p>
  225. """.strip()
  226. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  227. self.assertEqual(expected_result, result["parsed_text"])
  228. self.assertEqual(result["images"], ["somewhere.com/image.jpg"])
  229. self.assertEqual(result["internal_links"], [])
  230. self.assertEqual(result["outgoing_links"], [])
  231. def test_clean_linked_image(self):
  232. """parser handles image element nested in link"""
  233. test_text = """
  234. [![3.png](http://test.com/a/thumb/test/43/)](http://test.com/a/test/43/)
  235. """.strip()
  236. expected_result = """
  237. <p><a href="/a/test/43/"><img alt="3.png" src="/a/thumb/test/43/"/></a></p>
  238. """.strip()
  239. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  240. self.assertEqual(expected_result, result["parsed_text"])
  241. self.assertEqual(result["images"], ["/a/thumb/test/43/"])
  242. self.assertEqual(result["internal_links"], ["/a/test/43/"])
  243. self.assertEqual(result["outgoing_links"], [])
  244. def test_force_shva(self):
  245. """parser appends ?shva=1 bit to attachment links if flag is present"""
  246. test_text = """
  247. ![3.png](http://test.com/a/thumb/test/43/)
  248. """.strip()
  249. expected_result = """
  250. <p><img alt="3.png" src="/a/thumb/test/43/?shva=1"/></p>
  251. """.strip()
  252. result = parse(
  253. test_text, MockRequest(), MockPoster(), minify=True, force_shva=True
  254. )
  255. self.assertEqual(expected_result, result["parsed_text"])
  256. self.assertEqual(result["images"], ["/a/thumb/test/43/"])
  257. self.assertEqual(result["internal_links"], [])
  258. self.assertEqual(result["outgoing_links"], [])
  259. def test_remove_shva(self):
  260. """parser removes ?shva=1 bit from attachment links if flag is absent"""
  261. test_text = """
  262. ![3.png](http://test.com/a/thumb/test/43/?shva=1)
  263. """.strip()
  264. expected_result = """
  265. <p><img alt="3.png" src="/a/thumb/test/43/"/></p>
  266. """.strip()
  267. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  268. self.assertEqual(expected_result, result["parsed_text"])
  269. self.assertEqual(result["images"], ["/a/thumb/test/43/?shva=1"])
  270. self.assertEqual(result["internal_links"], [])
  271. self.assertEqual(result["outgoing_links"], [])
  272. class LinkifyTests(TestCase):
  273. def test_clean_current_link(self):
  274. """clean_links step cleans http://test.com"""
  275. test_text = """
  276. Lorem ipsum: `<http://test.com>`
  277. """.strip()
  278. expected_result = """
  279. <p>Lorem ipsum: <code>&lt;http://test.com&gt;</code></p>
  280. """.strip()
  281. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  282. self.assertEqual(expected_result, result["parsed_text"])
  283. self.assertEqual(result["internal_links"], [])
  284. self.assertEqual(result["images"], [])
  285. self.assertEqual(result["outgoing_links"], [])
  286. class StriketroughTests(TestCase):
  287. def test_striketrough(self):
  288. """striketrough markdown deletes test"""
  289. test_text = """
  290. Lorem ~~ipsum, dolor~~ met.
  291. """.strip()
  292. expected_result = """
  293. <p>Lorem <del>ipsum, dolor</del> met.</p>
  294. """.strip()
  295. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  296. self.assertEqual(expected_result, result["parsed_text"])
  297. class QuoteTests(TestCase):
  298. def test_quotes(self):
  299. """bbcode for quote is supported"""
  300. test_text = """
  301. Lorem ipsum.
  302. [quote]Dolor met[/quote]
  303. [quote]Dolor <b>met</b>[/quote]
  304. [quote]Dolor **met**[quote]Dolor met[/quote][/quote]
  305. """.strip()
  306. expected_result = """
  307. <p>Lorem ipsum.</p>
  308. <aside class="quote-block">
  309. <div class="quote-heading"></div>
  310. <blockquote class="quote-body">
  311. <p>Dolor met</p>
  312. </blockquote>
  313. </aside>
  314. <aside class="quote-block">
  315. <div class="quote-heading"></div>
  316. <blockquote class="quote-body">
  317. <p>Dolor &lt;b&gt;met&lt;/b&gt;</p>
  318. </blockquote>
  319. </aside>
  320. <aside class="quote-block">
  321. <div class="quote-heading"></div>
  322. <blockquote class="quote-body">
  323. <p>Dolor <strong>met</strong></p>
  324. <aside class="quote-block">
  325. <div class="quote-heading"></div>
  326. <blockquote class="quote-body">
  327. <p>Dolor met</p>
  328. </blockquote>
  329. </aside>
  330. </blockquote>
  331. </aside>
  332. """.strip()
  333. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  334. self.assertEqual(expected_result, result["parsed_text"])
  335. def test_authored_quotes(self):
  336. """bbcode for authored quote is supported and handles mentions as well"""
  337. test_text = """
  338. Lorem ipsum.
  339. [quote]Dolor met[/quote]
  340. [quote=\"@Bob\"]Dolor <b>met</b>[/quote]
  341. [quote]Dolor **met**[quote=@Bob]Dolor met[/quote][/quote]
  342. """.strip()
  343. expected_result = """
  344. <p>Lorem ipsum.</p>
  345. <aside class="quote-block">
  346. <div class="quote-heading"></div>
  347. <blockquote class="quote-body">
  348. <p>Dolor met</p>
  349. </blockquote>
  350. </aside>
  351. <aside class="quote-block">
  352. <div class="quote-heading">@Bob</div>
  353. <blockquote class="quote-body">
  354. <p>Dolor &lt;b&gt;met&lt;/b&gt;</p>
  355. </blockquote>
  356. </aside>
  357. <aside class="quote-block">
  358. <div class="quote-heading"></div>
  359. <blockquote class="quote-body">
  360. <p>Dolor <strong>met</strong></p>
  361. <aside class="quote-block">
  362. <div class="quote-heading">@Bob</div>
  363. <blockquote class="quote-body">
  364. <p>Dolor met</p>
  365. </blockquote>
  366. </aside>
  367. </blockquote>
  368. </aside>
  369. """.strip()
  370. request = MockRequest(user=MockPoster())
  371. result = parse(test_text, request, MockPoster(), minify=False)
  372. self.assertEqual(expected_result, result["parsed_text"])
  373. def test_custom_quote_title(self):
  374. """parser handles custom quotetitle"""
  375. test_text = """
  376. Lorem ipsum.
  377. [quote=\"Lorem ipsum very test\"]Dolor <b>met</b>[/quote]
  378. """.strip()
  379. expected_result = """
  380. <p>Lorem ipsum.</p>
  381. <aside class="quote-block">
  382. <div class="quote-heading">Lorem ipsum very test</div>
  383. <blockquote class="quote-body">
  384. <p>Dolor &lt;b&gt;met&lt;/b&gt;</p>
  385. </blockquote>
  386. </aside>
  387. """.strip()
  388. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  389. self.assertEqual(expected_result, result["parsed_text"])
  390. def test_hr_edge_case(self):
  391. """test for weird edge case in which hr gets moved outside of quote"""
  392. test_text = """
  393. Lorem ipsum.
  394. [quote]
  395. Dolor met
  396. - - - - -
  397. Amet elit
  398. [/quote]
  399. """.strip()
  400. expected_result = """
  401. <p>Lorem ipsum.</p>
  402. <aside class="quote-block">
  403. <div class="quote-heading"></div>
  404. <blockquote class="quote-body">
  405. <p>Dolor met</p>
  406. <hr/>
  407. <p>Amet elit</p>
  408. </blockquote>
  409. </aside>
  410. """.strip()
  411. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  412. self.assertEqual(expected_result, result["parsed_text"])
  413. class CodeTests(TestCase):
  414. def test_code(self):
  415. """code bbcode is correctly parsed"""
  416. test_text = """
  417. Lorem ipsum.
  418. [code]
  419. Dolor [b]met.[/b]
  420. [/code]
  421. """.strip()
  422. expected_result = """
  423. <p>Lorem ipsum.</p>
  424. <pre><code>Dolor [b]met.[/b]</code></pre>
  425. """.strip()
  426. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  427. self.assertEqual(expected_result, result["parsed_text"])
  428. def test_inline_code(self):
  429. """inline code bbcode is correctly parsed"""
  430. test_text = """
  431. Lorem ipsum.
  432. [code]Dolor [b]met.[/b][/code]
  433. """.strip()
  434. expected_result = """
  435. <p>Lorem ipsum.</p>
  436. <pre><code>Dolor [b]met.[/b]</code></pre>
  437. """.strip()
  438. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  439. self.assertEqual(expected_result, result["parsed_text"])
  440. def test_code_strip(self):
  441. """code bbcode trims its content"""
  442. test_text = """
  443. Lorem ipsum.
  444. [code]
  445. Dolor [b]met.[/b]
  446. [/code]
  447. """.strip()
  448. expected_result = """
  449. <p>Lorem ipsum.</p>
  450. <pre><code> Dolor [b]met.[/b]</code></pre>
  451. """.strip()
  452. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  453. self.assertEqual(expected_result, result["parsed_text"])
  454. def test_code_language(self):
  455. """code bbcode with language is correctly parsed"""
  456. test_text = """
  457. Lorem ipsum.
  458. [code="python"]
  459. Dolor [b]met.[/b]
  460. [/code]
  461. """.strip()
  462. expected_result = """
  463. <p>Lorem ipsum.</p>
  464. <pre><code class="python">Dolor [b]met.[/b]</code></pre>
  465. """.strip()
  466. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  467. self.assertEqual(expected_result, result["parsed_text"])
    def test_code_language_optional_quotes(self):
        """code language is recognised when only one of the surrounding quotes is present"""
        # NOTE(review): inputs reproduced line for line from the reviewed copy,
        # which shows no blank lines -- confirm against the repository version.

        # Case 1: quote only after the language name.
        test_text = """
Lorem ipsum.
[code=python"]
Dolor [b]met.[/b]
[/code]
        """.strip()
        expected_result = """
<p>Lorem ipsum.</p>
<pre><code class="python">Dolor [b]met.[/b]</code></pre>
        """.strip()
        result = parse(test_text, MockRequest(), MockPoster(), minify=False)
        self.assertEqual(expected_result, result["parsed_text"])
        # Case 2: quote only before the language name; same expected output.
        test_text = """
Lorem ipsum.
[code="python]
Dolor [b]met.[/b]
[/code]
        """.strip()
        expected_result = """
<p>Lorem ipsum.</p>
<pre><code class="python">Dolor [b]met.[/b]</code></pre>
        """.strip()
        result = parse(test_text, MockRequest(), MockPoster(), minify=False)
        self.assertEqual(expected_result, result["parsed_text"])