Files
piratepoet/lib/Newsletter/Links/Links.php

220 lines
7.4 KiB
PHP

<?php
namespace MailPoet\Newsletter\Links;
use MailPoet\Models\Subscriber;
use MailPoet\Router\Router;
use MailPoet\Router\Endpoints\Track as TrackEndpoint;
use MailPoet\Models\NewsletterLink;
use MailPoet\Newsletter\Shortcodes\Shortcodes;
use MailPoet\Util\Helpers;
use MailPoet\Util\Security;
class Links {
const DATA_TAG_CLICK = '[mailpoet_click_data]';
const DATA_TAG_OPEN = '[mailpoet_open_data]';
const LINK_TYPE_SHORTCODE = 'shortcode';
const LINK_TYPE_LINK = 'link';
static function process($content) {
$extracted_links = self::extract($content);
$processed_links = self::hash($extracted_links);
return self::replace($content, $extracted_links, $processed_links);
}
static function extract($content) {
$extracted_links = array();
// adopted from WP's wp_extract_urls() function & modified to work on hrefs
# match href=' or href="
$regex = '#(?:href.*?=.*?)(["\']?)('
# match http://
. '(?:([\w-]+:)?//?)'
# match everything except for special characters # until .
. '[^\s()<>]+'
. '[.]'
# conditionally match everything except for special characters after .
. '(?:'
. '\([\w\d]+\)|'
. '(?:'
. '[^`!()\[\]{}:;\'".,<>«»“”‘’\s]|'
. '(?:[:]\d+)?/?'
. ')+'
. ')'
. ')\\1#';
// extract shortcodes with [link:*] format
$shortcodes = new Shortcodes();
$shortcodes = $shortcodes->extract($content, $categories = array('link'));
if($shortcodes) {
$extracted_links = array_map(function($shortcode) {
return array(
'type' => Links::LINK_TYPE_SHORTCODE,
'html' => $shortcode,
'link' => $shortcode
);
}, $shortcodes);
}
// extract urls with href="url" format
preg_match_all($regex, $content, $matched_urls);
$matched_urls_count = count($matched_urls[0]);
if($matched_urls_count) {
for($index = 0; $index < $matched_urls_count; $index++) {
$extracted_links[] = array(
'type' => self::LINK_TYPE_LINK,
'html' => $matched_urls[0][$index],
'link' => $matched_urls[2][$index]
);
}
}
return array_unique($extracted_links, SORT_REGULAR);
}
static function hash($extracted_links) {
$processed_links = array();
foreach($extracted_links as $extracted_link) {
$hash = Security::generateHash();
// Use URL as a key to map between extracted and processed links
// regardless of their sequential position (useful for link skips etc.)
$key = $extracted_link['link'];
$processed_links[$key] = array(
'hash' => $hash,
'url' => $extracted_link['link'],
// replace link with a temporary data tag + hash
// it will be further replaced with the proper track API URL during sending
'processed_link' => self::DATA_TAG_CLICK . '-' . $hash
);
}
return $processed_links;
}
static function replace($content, $extracted_links, $processed_links) {
foreach($extracted_links as $key => $extracted_link) {
$key = $extracted_link['link'];
if(!($hasReplacement = isset($processed_links[$key]['processed_link']))) {
continue;
}
$processed_link = $processed_links[$key]['processed_link'];
// first, replace URL in the extracted HTML source with encoded link
$processed_link_html_source = str_replace(
$extracted_link['link'], $processed_link,
$extracted_link['html']
);
// second, replace original extracted HTML source with processed URL source
$content = str_replace(
$extracted_link['html'], $processed_link_html_source, $content
);
// third, replace text version URL with processed link: [description](url)
// regex is used to avoid replacing description URLs that are wrapped in round brackets
// i.e., <a href="http://google.com">(http://google.com)</a> => [(http://google.com)](http://processed_link)
$regex_escaped_extracted_link = preg_quote($extracted_link['link'], '/');
$content = preg_replace(
'/\[(.*?)\](\(' . $regex_escaped_extracted_link . '\))/',
'[$1](' . $processed_link . ')',
$content
);
// Clean up data used to generate a new link
unset($processed_links[$key]['processed_link']);
}
return array(
$content,
array_values($processed_links)
);
}
static function replaceSubscriberData(
$subscriber_id,
$queue_id,
$content,
$preview = false
) {
// match data tags
$subscriber = Subscriber::findOne($subscriber_id);
preg_match_all(self::getLinkRegex(), $content, $matches);
foreach($matches[1] as $index => $match) {
$hash = null;
if(preg_match('/-/', $match)) {
list(, $hash) = explode('-', $match);
}
$data = self::createUrlDataObject(
$subscriber->id,
$subscriber->email,
$queue_id,
$hash,
$preview
);
$router_action = ($matches[2][$index] === self::DATA_TAG_CLICK) ?
TrackEndpoint::ACTION_CLICK :
TrackEndpoint::ACTION_OPEN;
$link = Router::buildRequest(
TrackEndpoint::ENDPOINT,
$router_action,
$data
);
$content = str_replace($match, $link, $content);
}
return $content;
}
static function save(array $links, $newsletter_id, $queue_id) {
foreach($links as $link) {
if(empty($link['hash']) || empty($link['url'])) continue;
$newsletter_link = NewsletterLink::create();
$newsletter_link->newsletter_id = $newsletter_id;
$newsletter_link->queue_id = $queue_id;
$newsletter_link->hash = $link['hash'];
$newsletter_link->url = $link['url'];
$newsletter_link->save();
}
}
static function convertHashedLinksToShortcodesAndUrls($content, $queue_id, $convert_all = false) {
preg_match_all(self::getLinkRegex(), $content, $links);
$links = array_unique(Helpers::flattenArray($links));
foreach($links as $link) {
$link_hash = explode('-', $link);
if(!isset($link_hash[1])) continue;
$newsletter_link = NewsletterLink::where('hash', $link_hash[1])
->where('queue_id', $queue_id)
->findOne();
// convert either only link shortcodes or all hashes links if "convert all"
// option is specified
if($newsletter_link &&
(preg_match('/\[link:/', $newsletter_link->url) || $convert_all)
) {
$content = str_replace($link, $newsletter_link->url, $content);
}
}
return $content;
}
static function getLinkRegex() {
return sprintf(
'/((%s|%s)(?:-\w+)?)/',
preg_quote(self::DATA_TAG_CLICK),
preg_quote(self::DATA_TAG_OPEN)
);
}
static function createUrlDataObject(
$subscriber_id, $subscriber_email, $queue_id, $link_hash, $preview
) {
return array(
$subscriber_id,
Subscriber::generateToken($subscriber_email),
$queue_id,
$link_hash,
$preview
);
}
static function transformUrlDataObject($data) {
reset($data);
if(!is_int(key($data))) return $data;
$transformed_data = array();
$transformed_data['subscriber_id'] = (!empty($data[0])) ? $data[0] : false;
$transformed_data['subscriber_token'] = (!empty($data[1])) ? $data[1] : false;
$transformed_data['queue_id'] = (!empty($data[2])) ? $data[2] : false;
$transformed_data['link_hash'] = (!empty($data[3])) ? $data[3] : false;
$transformed_data['preview'] = (!empty($data[4])) ? $data[4] : false;
return $transformed_data;
}
}