test_parser.py 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615
  1. # -*- coding: utf-8 -*-
  2. from __future__ import unicode_literals
  3. from django.contrib.auth import get_user_model
  4. from django.test import TestCase
  5. from misago.markup.parser import parse
# Resolve the project's active user model once at import time; it is used
# below to create a real user for the mention-parsing test.
UserModel = get_user_model()
  7. class MockRequest(object):
  8. scheme = 'http'
  9. def __init__(self, user=None):
  10. self.user = user
  11. def get_host(self):
  12. return 'test.com'
  13. class MockPoster(object):
  14. username = 'LoremIpsum'
  15. slug = 'loremipsum'
  16. class HTMLTests(TestCase):
  17. def test_html_escaped(self):
  18. """parser escapes all html"""
  19. test_text = """
  20. Lorem <strong>ipsum!</strong>
  21. """.strip()
  22. expected_result = """
  23. <p>Lorem &lt;strong&gt;ipsum!&lt;/strong&gt;</p>
  24. """.strip()
  25. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  26. self.assertEqual(expected_result, result['parsed_text'])
  27. self.assertEqual(result['internal_links'], [])
  28. self.assertEqual(result['images'], [])
  29. self.assertEqual(result['outgoing_links'], [])
  30. class BBCodeTests(TestCase):
  31. def test_inline_text(self):
  32. """inline elements are correctly parsed"""
  33. test_text = """
  34. Lorem **ipsum**, dolor met.
  35. Lorem [b]ipsum[/b], [i]dolor[/i] [u]met[/u].
  36. Lorem [b]**ipsum**[/b] [i]dolor[/i] [u]met[/u].
  37. Lorem [b]**ipsum[/b]** [i]dolor[/i] [u]met[/u].
  38. Lorem [b]__ipsum[/b]__ [i]dolor[/i] [u]met[/u].
  39. Lorem [b][i]ipsum[/i][/b].
  40. Lorem [b][i]ipsum[/b][/i].
  41. Lorem [b]ipsum[/B].
  42. """.strip()
  43. expected_result = """
  44. <p>Lorem <strong>ipsum</strong>, dolor met.</p>
  45. <p>Lorem <b>ipsum</b>, <i>dolor</i> <u>met</u>.</p>
  46. <p>Lorem <b><strong>ipsum</strong></b> <i>dolor</i> <u>met</u>.</p>
  47. <p>Lorem <b>**ipsum</b>** <i>dolor</i> <u>met</u>.</p>
  48. <p>Lorem <b>__ipsum</b>__ <i>dolor</i> <u>met</u>.</p>
  49. <p>Lorem <b><i>ipsum</i></b>.</p>
  50. <p>Lorem <b>[i]ipsum</b>[/i].</p>
  51. <p>Lorem <b>ipsum</b>.</p>
  52. """.strip()
  53. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  54. self.assertEqual(expected_result, result['parsed_text'])
  55. def test_hr(self):
  56. """hr bbcode is correctly parsed"""
  57. test_text = """
  58. Lorem ipsum.
  59. [hr]
  60. Dolor met.
  61. """.strip()
  62. expected_result = """
  63. <p>Lorem ipsum.</p>
  64. <hr/>
  65. <p>Dolor met.</p>
  66. """.strip()
  67. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  68. self.assertEqual(expected_result, result['parsed_text'])
  69. def test_img(self):
  70. """img bbcode is correctly parsed"""
  71. test_text = """
  72. Lorem ipsum [img]https://placekitten.com/g/1200/500[/img]
  73. Lorem ipsum [iMg]https://placekitten.com/g/1200/500[/ImG]
  74. Lorem ipsum !(https://placekitten.com/g/1200/500)
  75. """.strip()
  76. expected_result = """
  77. <p>Lorem ipsum <img alt="placekitten.com/g/1200/500" src="https://placekitten.com/g/1200/500"/></p>
  78. <p>Lorem ipsum <img alt="placekitten.com/g/1200/500" src="https://placekitten.com/g/1200/500"/></p>
  79. <p>Lorem ipsum <img alt="placekitten.com/g/1200/500" src="https://placekitten.com/g/1200/500"/></p>
  80. """.strip()
  81. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  82. self.assertEqual(expected_result, result['parsed_text'])
  83. def test_url(self):
  84. """url bbcode is correctly parsed"""
  85. test_text = """
  86. Lorem ipsum [url]placekitten.com/g/300/300[/url]
  87. Lorem ipsum [url]https://placekitten.com/g/600/600[/url]
  88. Lorem ipsum [uRL=https://placekitten.com/g/400/400"]Label text![/UrL]
  89. Lorem ipsum [Lorem ipsum](https://placekitten.com/g/1200/500)
  90. """.strip()
  91. expected_result = """
  92. <p>Lorem ipsum <a href="http://placekitten.com/g/300/300" rel="nofollow">placekitten.com/g/300/300</a></p>
  93. <p>Lorem ipsum <a href="https://placekitten.com/g/600/600" rel="nofollow">placekitten.com/g/600/600</a></p>
  94. <p>Lorem ipsum <a href="https://placekitten.com/g/400/400" rel="nofollow">Label text!</a></p>
  95. <p>Lorem ipsum <a href="https://placekitten.com/g/1200/500" rel="nofollow">Lorem ipsum</a></p>
  96. """.strip()
  97. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  98. self.assertEqual(expected_result, result['parsed_text'])
  99. class MinifyTests(TestCase):
  100. def test_minified_text(self):
  101. """parser minifies text successfully"""
  102. test_text = """
  103. Lorem ipsum.
  104. Lorem ipsum.
  105. """.strip()
  106. expected_result = """
  107. <p>Lorem ipsum.</p><p>Lorem ipsum.</p>
  108. """.strip()
  109. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  110. self.assertEqual(expected_result, result['parsed_text'])
  111. def test_minified_unicode_text(self):
  112. """parser minifies unicode text successfully"""
  113. test_text = """
  114. Bżęczyszczykiewłicz ipsum.
  115. Lorem ipsum.
  116. """.strip()
  117. expected_result = """
  118. <p>Bżęczyszczykiewłicz ipsum.</p><p>Lorem ipsum.</p>
  119. """.strip()
  120. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  121. self.assertEqual(expected_result, result['parsed_text'])
  122. def test_complex_paragraph(self):
  123. """parser minifies complex paragraph"""
  124. user = UserModel.objects.create_user('Bob', 'bob@test.com', 'Pass123')
  125. test_text = """
  126. Hey there @{}, how's going?
  127. """.strip().format(user)
  128. expected_result = """
  129. <p>Hey there <a href="{}">@{}</a>, how's going?</p>
  130. """.strip().format(user.get_absolute_url(), user)
  131. result = parse(test_text, MockRequest(user), user, minify=True)
  132. self.assertEqual(expected_result, result['parsed_text'])
  133. class CleanLinksTests(TestCase):
  134. def test_clean_current_link(self):
  135. """clean_links step cleans http://test.com"""
  136. test_text = """
  137. Lorem ipsum: http://test.com
  138. """.strip()
  139. expected_result = """
  140. <p>Lorem ipsum: <a href="/">test.com</a></p>
  141. """.strip()
  142. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  143. self.assertEqual(expected_result, result['parsed_text'])
  144. self.assertEqual(result['internal_links'], ['/'])
  145. self.assertEqual(result['images'], [])
  146. self.assertEqual(result['outgoing_links'], [])
  147. def test_clean_schemaless_link(self):
  148. """clean_links step cleans test.com"""
  149. test_text = """
  150. Lorem ipsum: test.com
  151. """.strip()
  152. expected_result = """
  153. <p>Lorem ipsum: <a href="/">test.com</a></p>
  154. """.strip()
  155. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  156. self.assertEqual(expected_result, result['parsed_text'])
  157. self.assertEqual(result['internal_links'], ['/'])
  158. self.assertEqual(result['images'], [])
  159. self.assertEqual(result['outgoing_links'], [])
  160. def test_trim_current_path(self):
  161. """clean_links step leaves http://test.com path"""
  162. test_text = """
  163. Lorem ipsum: http://test.com/somewhere-something/
  164. """.strip()
  165. expected_result = """
  166. <p>Lorem ipsum: <a href="/somewhere-something/">test.com/somewhere-something/</a></p>
  167. """.strip()
  168. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  169. self.assertEqual(expected_result, result['parsed_text'])
  170. self.assertEqual(result['internal_links'], ['/somewhere-something/'])
  171. self.assertEqual(result['images'], [])
  172. self.assertEqual(result['outgoing_links'], [])
  173. def test_clean_outgoing_link_domain(self):
  174. """clean_links step leaves outgoing domain link"""
  175. test_text = """
  176. Lorem ipsum: http://somewhere.com
  177. """.strip()
  178. expected_result = """
  179. <p>Lorem ipsum: <a href="http://somewhere.com" rel="nofollow">somewhere.com</a></p>
  180. """.strip()
  181. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  182. self.assertEqual(expected_result, result['parsed_text'])
  183. self.assertEqual(result['outgoing_links'], ['somewhere.com'])
  184. self.assertEqual(result['images'], [])
  185. self.assertEqual(result['internal_links'], [])
  186. def test_trim_outgoing_path(self):
  187. """clean_links step leaves outgoing link domain and path"""
  188. test_text = """
  189. Lorem ipsum: http://somewhere.com/somewhere-something/
  190. """.strip()
  191. expected_result = """
  192. <p>Lorem ipsum: <a href="http://somewhere.com/somewhere-something/" rel="nofollow">somewhere.com/somewhere-something/</a></p>
  193. """.strip()
  194. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  195. self.assertEqual(expected_result, result['parsed_text'])
  196. self.assertEqual(result['outgoing_links'], ['somewhere.com/somewhere-something/'])
  197. self.assertEqual(result['images'], [])
  198. self.assertEqual(result['internal_links'], [])
  199. def test_clean_local_image_src(self):
  200. """clean_links step cleans local image src"""
  201. test_text = """
  202. !(http://test.com/image.jpg)
  203. """.strip()
  204. expected_result = """
  205. <p><img alt="test.com/image.jpg" src="/image.jpg"/></p>
  206. """.strip()
  207. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  208. self.assertEqual(expected_result, result['parsed_text'])
  209. self.assertEqual(result['images'], ['/image.jpg'])
  210. self.assertEqual(result['internal_links'], [])
  211. self.assertEqual(result['outgoing_links'], [])
  212. def test_clean_remote_image_src(self):
  213. """clean_links step cleans remote image src"""
  214. test_text = """
  215. !(http://somewhere.com/image.jpg)
  216. """.strip()
  217. expected_result = """
  218. <p><img alt="somewhere.com/image.jpg" src="http://somewhere.com/image.jpg"/></p>
  219. """.strip()
  220. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  221. self.assertEqual(expected_result, result['parsed_text'])
  222. self.assertEqual(result['images'], ['somewhere.com/image.jpg'])
  223. self.assertEqual(result['internal_links'], [])
  224. self.assertEqual(result['outgoing_links'], [])
  225. def test_clean_linked_image(self):
  226. """parser handles image element nested in link"""
  227. test_text = """
  228. [![3.png](http://test.com/a/thumb/test/43/)](http://test.com/a/test/43/)
  229. """.strip()
  230. expected_result = """
  231. <p><a href="/a/test/43/"><img alt="3.png" src="/a/thumb/test/43/"/></a></p>
  232. """.strip()
  233. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  234. self.assertEqual(expected_result, result['parsed_text'])
  235. self.assertEqual(result['images'], ['/a/thumb/test/43/'])
  236. self.assertEqual(result['internal_links'], ['/a/test/43/'])
  237. self.assertEqual(result['outgoing_links'], [])
  238. def test_force_shva(self):
  239. """parser appends ?shva=1 bit to attachment links if flag is present"""
  240. test_text = """
  241. ![3.png](http://test.com/a/thumb/test/43/)
  242. """.strip()
  243. expected_result = """
  244. <p><img alt="3.png" src="/a/thumb/test/43/?shva=1"/></p>
  245. """.strip()
  246. result = parse(test_text, MockRequest(), MockPoster(), minify=True, force_shva=True)
  247. self.assertEqual(expected_result, result['parsed_text'])
  248. self.assertEqual(result['images'], ['/a/thumb/test/43/'])
  249. self.assertEqual(result['internal_links'], [])
  250. self.assertEqual(result['outgoing_links'], [])
  251. def test_remove_shva(self):
  252. """parser removes ?shva=1 bit from attachment links if flag is absent"""
  253. test_text = """
  254. ![3.png](http://test.com/a/thumb/test/43/?shva=1)
  255. """.strip()
  256. expected_result = """
  257. <p><img alt="3.png" src="/a/thumb/test/43/"/></p>
  258. """.strip()
  259. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  260. self.assertEqual(expected_result, result['parsed_text'])
  261. self.assertEqual(result['images'], ['/a/thumb/test/43/?shva=1'])
  262. self.assertEqual(result['internal_links'], [])
  263. self.assertEqual(result['outgoing_links'], [])
  264. class LinkifyTests(TestCase):
  265. def test_clean_current_link(self):
  266. """clean_links step cleans http://test.com"""
  267. test_text = """
  268. Lorem ipsum: `<http://test.com>`
  269. """.strip()
  270. expected_result = """
  271. <p>Lorem ipsum: <code>&lt;http://test.com&gt;</code></p>
  272. """.strip()
  273. result = parse(test_text, MockRequest(), MockPoster(), minify=True)
  274. self.assertEqual(expected_result, result['parsed_text'])
  275. self.assertEqual(result['internal_links'], [])
  276. self.assertEqual(result['images'], [])
  277. self.assertEqual(result['outgoing_links'], [])
  278. class StriketroughTests(TestCase):
  279. def test_striketrough(self):
  280. """striketrough markdown deletes test"""
  281. test_text = """
  282. Lorem ~~ipsum, dolor~~ met.
  283. """.strip()
  284. expected_result = """
  285. <p>Lorem <del>ipsum, dolor</del> met.</p>
  286. """.strip()
  287. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  288. self.assertEqual(expected_result, result['parsed_text'])
  289. class QuoteTests(TestCase):
  290. def test_quotes(self):
  291. """bbcode for quote is supported"""
  292. test_text = """
  293. Lorem ipsum.
  294. [quote]Dolor met[/quote]
  295. [quote]Dolor <b>met</b>[/quote]
  296. [quote]Dolor **met**[quote]Dolor met[/quote][/quote]
  297. """.strip()
  298. expected_result = """
  299. <p>Lorem ipsum.</p>
  300. <aside class="quote-block">
  301. <div class="quote-heading"></div>
  302. <blockquote class="quote-body">
  303. <p>Dolor met</p>
  304. </blockquote>
  305. </aside>
  306. <aside class="quote-block">
  307. <div class="quote-heading"></div>
  308. <blockquote class="quote-body">
  309. <p>Dolor &lt;b&gt;met&lt;/b&gt;</p>
  310. </blockquote>
  311. </aside>
  312. <aside class="quote-block">
  313. <div class="quote-heading"></div>
  314. <blockquote class="quote-body">
  315. <p>Dolor <strong>met</strong></p>
  316. <aside class="quote-block">
  317. <div class="quote-heading"></div>
  318. <blockquote class="quote-body">
  319. <p>Dolor met</p>
  320. </blockquote>
  321. </aside>
  322. </blockquote>
  323. </aside>
  324. """.strip()
  325. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  326. self.assertEqual(expected_result, result['parsed_text'])
  327. def test_authored_quotes(self):
  328. """bbcode for authored quote is supported and handles mentions as well"""
  329. test_text = """
  330. Lorem ipsum.
  331. [quote]Dolor met[/quote]
  332. [quote=\"@Bob\"]Dolor <b>met</b>[/quote]
  333. [quote]Dolor **met**[quote=@Bob]Dolor met[/quote][/quote]
  334. """.strip()
  335. expected_result = """
  336. <p>Lorem ipsum.</p>
  337. <aside class="quote-block">
  338. <div class="quote-heading"></div>
  339. <blockquote class="quote-body">
  340. <p>Dolor met</p>
  341. </blockquote>
  342. </aside>
  343. <aside class="quote-block">
  344. <div class="quote-heading">@Bob</div>
  345. <blockquote class="quote-body">
  346. <p>Dolor &lt;b&gt;met&lt;/b&gt;</p>
  347. </blockquote>
  348. </aside>
  349. <aside class="quote-block">
  350. <div class="quote-heading"></div>
  351. <blockquote class="quote-body">
  352. <p>Dolor <strong>met</strong></p>
  353. <aside class="quote-block">
  354. <div class="quote-heading">@Bob</div>
  355. <blockquote class="quote-body">
  356. <p>Dolor met</p>
  357. </blockquote>
  358. </aside>
  359. </blockquote>
  360. </aside>
  361. """.strip()
  362. request = MockRequest(user=MockPoster())
  363. result = parse(test_text, request, MockPoster(), minify=False)
  364. self.assertEqual(expected_result, result['parsed_text'])
  365. def test_custom_quote_title(self):
  366. """parser handles custom quotetitle"""
  367. test_text = """
  368. Lorem ipsum.
  369. [quote=\"Lorem ipsum very test\"]Dolor <b>met</b>[/quote]
  370. """.strip()
  371. expected_result = """
  372. <p>Lorem ipsum.</p>
  373. <aside class="quote-block">
  374. <div class="quote-heading">Lorem ipsum very test</div>
  375. <blockquote class="quote-body">
  376. <p>Dolor &lt;b&gt;met&lt;/b&gt;</p>
  377. </blockquote>
  378. </aside>
  379. """.strip()
  380. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  381. self.assertEqual(expected_result, result['parsed_text'])
  382. def test_hr_edge_case(self):
  383. """test for weird edge case in which hr gets moved outside of quote"""
  384. test_text = """
  385. Lorem ipsum.
  386. [quote]
  387. Dolor met
  388. - - - - -
  389. Amet elit
  390. [/quote]
  391. """.strip()
  392. expected_result = """
  393. <p>Lorem ipsum.</p>
  394. <aside class="quote-block">
  395. <div class="quote-heading"></div>
  396. <blockquote class="quote-body">
  397. <p>Dolor met</p>
  398. <hr/>
  399. <p>Amet elit</p>
  400. </blockquote>
  401. </aside>
  402. """.strip()
  403. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  404. self.assertEqual(expected_result, result['parsed_text'])
  405. class CodeTests(TestCase):
  406. def test_code(self):
  407. """code bbcode is correctly parsed"""
  408. test_text = """
  409. Lorem ipsum.
  410. [code]
  411. Dolor [b]met.[/b]
  412. [/code]
  413. """.strip()
  414. expected_result = """
  415. <p>Lorem ipsum.</p>
  416. <pre><code>Dolor [b]met.[/b]</code></pre>
  417. """.strip()
  418. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  419. self.assertEqual(expected_result, result['parsed_text'])
  420. def test_inline_code(self):
  421. """inline code bbcode is correctly parsed"""
  422. test_text = """
  423. Lorem ipsum.
  424. [code]Dolor [b]met.[/b][/code]
  425. """.strip()
  426. expected_result = """
  427. <p>Lorem ipsum.</p>
  428. <pre><code>Dolor [b]met.[/b]</code></pre>
  429. """.strip()
  430. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  431. self.assertEqual(expected_result, result['parsed_text'])
  432. def test_code_strip(self):
  433. """code bbcode trims its content"""
  434. test_text = """
  435. Lorem ipsum.
  436. [code]
  437. Dolor [b]met.[/b]
  438. [/code]
  439. """.strip()
  440. expected_result = """
  441. <p>Lorem ipsum.</p>
  442. <pre><code> Dolor [b]met.[/b]</code></pre>
  443. """.strip()
  444. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  445. self.assertEqual(expected_result, result['parsed_text'])
  446. def test_code_language(self):
  447. """code bbcode with language is correctly parsed"""
  448. test_text = """
  449. Lorem ipsum.
  450. [code="python"]
  451. Dolor [b]met.[/b]
  452. [/code]
  453. """.strip()
  454. expected_result = """
  455. <p>Lorem ipsum.</p>
  456. <pre><code class="python">Dolor [b]met.[/b]</code></pre>
  457. """.strip()
  458. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  459. self.assertEqual(expected_result, result['parsed_text'])
  460. def test_code_language_optional_quotes(self):
  461. """code quotes around language name are optional"""
  462. test_text = """
  463. Lorem ipsum.
  464. [code=python"]
  465. Dolor [b]met.[/b]
  466. [/code]
  467. """.strip()
  468. expected_result = """
  469. <p>Lorem ipsum.</p>
  470. <pre><code class="python">Dolor [b]met.[/b]</code></pre>
  471. """.strip()
  472. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  473. self.assertEqual(expected_result, result['parsed_text'])
  474. test_text = """
  475. Lorem ipsum.
  476. [code="python]
  477. Dolor [b]met.[/b]
  478. [/code]
  479. """.strip()
  480. expected_result = """
  481. <p>Lorem ipsum.</p>
  482. <pre><code class="python">Dolor [b]met.[/b]</code></pre>
  483. """.strip()
  484. result = parse(test_text, MockRequest(), MockPoster(), minify=False)
  485. self.assertEqual(expected_result, result['parsed_text'])