src/Content/Text/Markdown.php

   1 <?php
   2
   3 /**
   4  * @file src/Content/Text/Markdown.php
   5  */
   6
   7 namespace Friendica\Content\Text;
   8
   9 use Friendica\BaseObject;
  10 use Friendica\Model\Contact;
  11 use Michelf\MarkdownExtra;
  12 use Friendica\Content\Text\HTML;
  13
  14 /**
  15  * Friendica-specific usage of Markdown
  16  *
  17  * @author Hypolite Petovan <mrpetovan@gmail.com>
  18  */
  19 class Markdown extends BaseObject
  20 {
  21         /**
  22          * Converts a Markdown string into HTML. The hardwrap parameter maximizes
  23          * compatibility with Diaspora in spite of the Markdown standard.
  24          *
  25          * @brief Converts a Markdown string into HTML
  26          * @param string $text
  27          * @param bool   $hardwrap
  28          * @return string
  29          */
  30         public static function convert($text, $hardwrap = true) {
  31                 $stamp1 = microtime(true);
  32
  33                 $MarkdownParser = new MarkdownExtra();
  34                 $MarkdownParser->hard_wrap = $hardwrap;
  35                 $html = $MarkdownParser->transform($text);
  36
  37                 self::getApp()->save_timestamp($stamp1, "parser");
  38
  39                 return $html;
  40         }
  41
  42         /**
  43          * @brief Callback function to replace a Diaspora style mention in a mention for Friendica
  44          *
  45          * @param array $match Matching values for the callback
  46          * @return string Replaced mention
  47          */
  48         private static function diasporaMention2BBCodeCallback($match)
  49         {
  50                 if ($match[2] == '') {
  51                         return;
  52                 }
  53
  54                 $data = Contact::getDetailsByAddr($match[2]);
  55
  56                 $name = $match[1];
  57
  58                 if ($name == '') {
  59                         $name = $data['name'];
  60                 }
  61
  62                 return '@[url=' . $data['url'] . ']' . $name . '[/url]';
  63         }
  64
  65         /*
  66          * we don't want to support a bbcode specific markdown interpreter
  67          * and the markdown library we have is pretty good, but provides HTML output.
  68          * So we'll use that to convert to HTML, then convert the HTML back to bbcode,
  69          * and then clean up a few Diaspora specific constructs.
  70          */
  71         public static function toBBCode($s)
  72         {
  73                 $s = html_entity_decode($s, ENT_COMPAT, 'UTF-8');
  74
  75                 // Handles single newlines
  76                 $s = str_replace("\r\n", "\n", $s);
  77                 $s = str_replace("\n", " \n", $s);
  78                 $s = str_replace("\r", " \n", $s);
  79
  80                 // Replace lonely stars in lines not starting with it with literal stars
  81                 $s = preg_replace('/^([^\*]+)\*([^\*]*)$/im', '$1\*$2', $s);
  82
  83                 // The parser cannot handle paragraphs correctly
  84                 $s = str_replace(['</p>', '<p>', '<p dir="ltr">'], ['<br>', '<br>', '<br>'], $s);
  85
  86                 // Escaping the hash tags
  87                 $s = preg_replace('/\#([^\s\#])/', '&#35;$1', $s);
  88
  89                 $s = self::convert($s);
  90
  91                 $regexp = "/@\{(?:([^\}]+?); )?([^\} ]+)\}/";
  92                 $s = preg_replace_callback($regexp, ['self', 'diasporaMention2BBCodeCallback'], $s);
  93
  94                 $s = str_replace('&#35;', '#', $s);
  95
  96                 $s = HTML::toBBCode($s);
  97
  98                 // protect the recycle symbol from turning into a tag, but without unescaping angles and naked ampersands
  99                 $s = str_replace('&#x2672;', html_entity_decode('&#x2672;', ENT_QUOTES, 'UTF-8'), $s);
 100
 101                 // Convert everything that looks like a link to a link
 102                 $s = preg_replace('/([^\]=]|^)(https?\:\/\/)([a-zA-Z0-9:\/\-?&;.=_~#%$!+,@]+(?<!,))/ism', '$1[url=$2$3]$2$3[/url]', $s);
 103
 104                 //$s = preg_replace("/([^\]\=]|^)(https?\:\/\/)(vimeo|youtu|www\.youtube|soundcloud)([a-zA-Z0-9\:\/\-\?\&\;\.\=\_\~\#\%\$\!\+\,]+)/ism", '$1[url=$2$3$4]$2$3$4[/url]',$s);
 105                 $s = BBCode::pregReplaceInTag('/\[url\=?(.*?)\]https?:\/\/www.youtube.com\/watch\?v\=(.*?)\[\/url\]/ism', '[youtube]$2[/youtube]', 'url', $s);
 106                 $s = BBCode::pregReplaceInTag('/\[url\=https?:\/\/www.youtube.com\/watch\?v\=(.*?)\].*?\[\/url\]/ism'   , '[youtube]$1[/youtube]', 'url', $s);
 107                 $s = BBCode::pregReplaceInTag('/\[url\=?(.*?)\]https?:\/\/vimeo.com\/([0-9]+)(.*?)\[\/url\]/ism'        , '[vimeo]$2[/vimeo]'    , 'url', $s);
 108                 $s = BBCode::pregReplaceInTag('/\[url\=https?:\/\/vimeo.com\/([0-9]+)\](.*?)\[\/url\]/ism'              , '[vimeo]$1[/vimeo]'    , 'url', $s);
 109
 110                 // remove duplicate adjacent code tags
 111                 $s = preg_replace('/(\[code\])+(.*?)(\[\/code\])+/ism', '[code]$2[/code]', $s);
 112
 113                 // Don't show link to full picture (until it is fixed)
 114                 $s = BBCode::scaleExternalImages($s, false);
 115
 116                 return $s;
 117         }
 118 }