We are no longer offering accounts on this server. Consider https://gitlab.freedesktop.org/ as a place to host projects.

util.php 74.3 KB
Newer Older
1
<?php
/*
 * StatusNet - the distributed open-source microblogging tool
 * Copyright (C) 2008-2011, StatusNet, Inc.
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program.  If not, see <http://www.gnu.org/licenses/>.
 */

20
/* XXX: break up into separate modules (HTTP, user, files) */
21

22 23 24
/**
 * Show a server error.
 *
 * Builds a ServerErrorAction from the arguments and renders its page.
 *
 * @param string $msg  message passed to ServerErrorAction
 * @param int    $code code passed to ServerErrorAction (default 500)
 *
 * @return void
 */
function common_server_error($msg, $code=500)
{
    $err = new ServerErrorAction($msg, $code);
    $err->showPage();
}

31 32 33
/**
 * Show a user error.
 *
 * Builds a ClientErrorAction from the arguments and renders its page.
 *
 * @param string $msg  message passed to ClientErrorAction
 * @param int    $code code passed to ClientErrorAction (default 400)
 *
 * @return void
 */
function common_user_error($msg, $code=400)
{
    $err = new ClientErrorAction($msg, $code);
    $err->showPage();
}

40 41 42
/**
 * This should only be used at setup; processes switching languages
 * to send text to other users should use common_switch_locale().
 *
 * Exports the language through the LANGUAGE and LANG environment variables
 * and then asks setlocale() for it, trying several spellings of the UTF-8
 * codeset suffix before falling back to the bare language code.
 *
 * @param string $language Locale language code (optional; empty uses
 *                         common_language())
 * @return mixed the value returned by setlocale(): the locale that was
 *               set, or false if none of the candidates could be set
 */
function common_init_locale($language=null)
{
    if (!$language) {
        $language = common_language();
    }

    putenv('LANGUAGE='.$language);
    putenv('LANG='.$language);

    // setlocale() tries each candidate in order and stops at the first
    // one the system accepts.
    return setlocale(LC_ALL,
                     $language . ".utf8",
                     $language . ".UTF8",
                     $language . ".utf-8",
                     $language . ".UTF-8",
                     $language);
}

64 65 66
/**
 * Initialize locale and charset settings and gettext with our message catalog,
 * using the language chosen by common_language().
 *
 * This should generally only be run at framework initialization; code switching
 * languages at runtime should call common_switch_locale().
 *
 * @access private
 *
 * @return void
 */
function common_init_language()
{
    mb_internal_encoding('UTF-8');

    // Note that this setlocale() call may "fail" but this is harmless;
    // gettext will still select the right language.
    $language = common_language();

    if (!common_init_locale($language)) {
        // The requested locale doesn't exist on the system.
        //
        // gettext seems very picky... We first need to setlocale()
        // to a locale which _does_ exist on the system, and _then_
        // we can set in another locale that may not be set up
        // (say, ga_ES for Galego/Galician) it seems to take it.
        //
        // For some reason C and POSIX which are guaranteed to work
        // don't do the job. en_US.UTF-8 should be there most of the
        // time, but not guaranteed.
        $ok = common_init_locale("en_US");

        if (!$ok && strtolower(substr(PHP_OS, 0, 3)) != 'win') {
            // Try to find a complete, working locale on Unix/Linux...
            // @fixme shelling out feels awfully inefficient
            // but I don't think there's a more standard way.
            //
            // The backtick operator can yield null (no output or shell
            // execution unavailable); cast so explode() always gets a string.
            $all = (string) `locale -a`;
            foreach (explode("\n", $all) as $locale) {
                if (preg_match('/\.utf[-_]?8$/i', $locale)) {
                    $ok = setlocale(LC_ALL, $locale);
                    if ($ok) {
                        break;
                    }
                }
            }
        }

        if (!$ok) {
            common_log(LOG_ERR, "Unable to find a UTF-8 locale on this system; UI translations may not work.");
        }

        // Second attempt at the requested language now that some working
        // locale has (hopefully) been selected; the result is not needed.
        common_init_locale($language);
    }

    common_init_gettext();
}

/**
 * Point gettext at the "statusnet" message catalog.
 *
 * Resets LC_CTYPE to 'C', binds the domain to the directory configured as
 * 'site'/'locale_path', declares the catalog codeset as UTF-8 and makes
 * the domain the default one.
 *
 * @access private
 */
function common_init_gettext()
{
    $domain = "statusnet";

    setlocale(LC_CTYPE, 'C');

    // So we do not have to make people install the gettext locales
    bindtextdomain($domain, common_config('site', 'locale_path'));
    bind_textdomain_codeset($domain, "UTF-8");
    textdomain($domain);
}

/**
 * Switch locale during runtime, and poke gettext until it cries uncle.
 * Otherwise, sometimes it doesn't actually switch away from the old language.
 *
 * Sets the locale through common_init_locale() and then re-runs the gettext
 * binding done by common_init_gettext().
 *
 * @param string $language code for locale ('en', 'fr', 'pt_BR' etc)
 *
 * @return void
 */
function common_switch_locale($language=null)
{
    common_init_locale($language);

    // Same LC_CTYPE reset and "statusnet" domain binding as at startup.
    common_init_gettext();
}

148 149
/**
 * Get the timezone to use for the current request.
 *
 * @return mixed the logged-in user's timezone property when it is truthy,
 *               otherwise the 'site'/'timezone' configuration value
 */
function common_timezone()
{
    if (common_logged_in()) {
        $user = common_current_user();
        if ($user->timezone) {
            return $user->timezone;
        }
    }

    return common_config('site', 'timezone');
}

160 161 162 163 164 165 166 167 168 169 170 171 172 173
/**
 * Check a language code against the configured 'site'/'languages' list.
 *
 * We don't want to end up with a bogus code left over from some old junk,
 * so a code only counts when one of the configured entries has it as its
 * 'lang' value.
 *
 * @param string $lang language code to check
 *
 * @return bool true if a configured entry matches, false otherwise
 *              (including for an empty code)
 */
function common_valid_language($lang)
{
    if (!$lang) {
        return false;
    }

    $known = common_config('site', 'languages');
    foreach ($known as $entry) {
        if ($entry['lang'] == $lang) {
            return true;
        }
    }

    return false;
}

174 175
/**
 * Work out which language code to use for the current request.
 *
 * Order of preference: a valid ?uselang= query parameter, the logged-in
 * user's language, the best match for the browser's Accept-Language header
 * (only when 'site'/'langdetect' is enabled), and finally the
 * 'site'/'language' configuration value.
 *
 * @return string language code
 */
function common_language()
{
    // Allow ?uselang=xx override, very useful for debugging
    // and helping translators check usage and context.
    if (isset($_GET['uselang'])) {
        $uselang = strval($_GET['uselang']);
        if (common_valid_language($uselang)) {
            return $uselang;
        }
    }

    // If there is a user logged in and they've set a language preference
    // then return that one...
    if (_have_config() && common_logged_in()) {
        $user = common_current_user();

        if (common_valid_language($user->language)) {
            return $user->language;
        }
    }

    // Otherwise, find the best match for the languages requested by the
    // user's browser...
    if (common_config('site', 'langdetect')) {
        $httplang = isset($_SERVER['HTTP_ACCEPT_LANGUAGE']) ? $_SERVER['HTTP_ACCEPT_LANGUAGE'] : null;
        if (!empty($httplang)) {
            $language = client_prefered_language($httplang);
            if ($language) {
                return $language;
            }
        }
    }

    // Finally, if none of the above worked, use the site's default...
    return common_config('site', 'language');
}
209

210 211 212
/**
 * Salted, hashed passwords are stored in the DB.
 *
 * The hashing itself is delegated to event handlers: 'StartHashPassword'
 * is fired with a reference to the result, and 'EndHashPassword' is fired
 * afterwards only if the start event returned a truthy value.
 *
 * @param string  $password plaintext password
 * @param Profile $profile  profile passed through to the event handlers
 *                          (optional)
 *
 * @return string the hash produced by the handlers
 *
 * @throws PasswordHashException if no handler produced a non-empty hash
 */
function common_munge_password($password, Profile $profile=null)
{
    $hashed = null;

    if (Event::handle('StartHashPassword', array(&$hashed, $password, $profile))) {
        Event::handle('EndHashPassword', array(&$hashed, $password, $profile));
    }

    if (empty($hashed)) {
        throw new PasswordHashException();
    }

    return $hashed;
}

227 228 229
/**
 * Check if a username exists and has matching password.
 *
 * 'StartCheckPassword' handlers get the first chance to authenticate; if
 * that event returns a truthy value the built-in check runs: the user is
 * looked up by e-mail or by normalized nickname and the munged password is
 * compared with the stored one. 'EndCheckPassword' is always fired.
 *
 * @param string $nickname nickname or e-mail address
 * @param string $password plaintext password
 *
 * @return mixed the authenticated User, or false
 */
function common_check_user($nickname, $password)
{
    // empty nickname always unacceptable
    if (empty($nickname)) {
        return false;
    }

    $authenticatedUser = false;

    if (Event::handle('StartCheckPassword', array($nickname, $password, &$authenticatedUser))) {

        if (common_is_email($nickname)) {
            $user = User::getKV('email', common_canonical_email($nickname));
        } else {
            $user = User::getKV('nickname', Nickname::normalize($nickname));
        }

        if ($user instanceof User && !empty($password)) {
            $hashed = common_munge_password($password, $user->getProfile());
            // Strict comparison: strcmp() can return NULL for bad argument
            // types on older PHP, and NULL == 0 would count as a match.
            // NOTE(review): a constant-time comparison (hash_equals) would
            // be preferable once the minimum PHP version allows it.
            if (strcmp($hashed, $user->password) === 0) {
                //internal checking passed
                $authenticatedUser = $user;
            }
        }
    }

    Event::handle('EndCheckPassword', array($nickname, $password, $authenticatedUser));

    return $authenticatedUser;
}

259 260 261
/**
 * Is the current user logged in?
 *
 * @return bool true when common_current_user() returns anything but null
 */
function common_logged_in()
{
    return common_current_user() !== null;
}

267 268
/**
 * Is there a current PHP session?
 *
 * @return bool true when session_id() reports a non-empty id
 */
function common_have_session()
{
    // Cast first: session_id() may return false on failure, which must
    // count as "no session" just like the empty string.
    return ((string) session_id()) !== '';
}

272 273
/**
 * Start a session if there is not one already.
 *
 * When 'sessions'/'handle' is configured, Session::setSaveHandler() is
 * installed first. A session id supplied in the query string takes
 * precedence over one supplied by cookie. A freshly started session gets a
 * 'started' timestamp.
 *
 * NOTE(review): accepting the session id from $_GET allows a caller to
 * choose the id; confirm this is intended before relying on it.
 *
 * @return void
 */
function common_ensure_session()
{
    if (common_have_session()) {
        return;
    }

    if (common_config('sessions', 'handle')) {
        Session::setSaveHandler();
    }

    $name = session_name();
    $id = null;

    if (array_key_exists($name, $_GET)) {
        $id = $_GET[$name];
    } else if (array_key_exists($name, $_COOKIE)) {
        $id = $_COOKIE[$name];
    }

    // Request parameters can arrive as arrays ("name[]=x"); only a string
    // is usable as a session id.
    if (!is_string($id)) {
        $id = null;
    }

    if (isset($id)) {
        session_id($id);
    }

    @session_start();

    if (!isset($_SESSION['started'])) {
        $_SESSION['started'] = time();
        if (!empty($id)) {
            // Log the id actually used; it may have come from the query
            // string, in which case the cookie entry need not exist.
            common_log(LOG_WARNING, 'Session cookie "' . $id . '" ' .
                       ' is set but started value is null');
        }
    }
}

301 302 303 304
// Three kinds of arguments:
// 1) a user object
// 2) a nickname
// 3) null to clear
305

306
// Cached current user. Initialize to false ("not looked up yet");
// set to null if none found.
$_cur = false;

309 310
/**
 * Set, or clear, the current user.
 *
 * Three kinds of arguments:
 * 1) a User object
 * 2) a nickname (looked up with User::getKV)
 * 3) null to clear (only acted on when a session exists)
 *
 * @param mixed $user User, nickname string, or null
 *
 * @return mixed true after clearing, the User after a successful set,
 *               false otherwise
 *
 * @throws AuthorizationException if the user lacks Right::WEBLOGIN
 */
function common_set_user($user)
{
    global $_cur;

    if (is_null($user) && common_have_session()) {
        $_cur = null;
        unset($_SESSION['userid']);
        return true;
    } else if (is_string($user)) {
        $nickname = $user;
        $user = User::getKV('nickname', $nickname);
    } else if (!$user instanceof User) {
        return false;
    }

    if ($user) {
        // Handlers receive $user by reference and may replace or empty it.
        if (Event::handle('StartSetUser', array(&$user))) {
            if (!empty($user)) {
                if (!$user->hasRight(Right::WEBLOGIN)) {
                    // TRANS: Authorisation exception thrown when a user a not allowed to login.
                    throw new AuthorizationException(_('Not allowed to log in.'));
                }
                common_ensure_session();
                $_SESSION['userid'] = $user->id;
                $_cur = $user;
                Event::handle('EndSetUser', array($user));
                return $_cur;
            }
        }
    }

    return false;
}

342 343
/**
 * Send a cookie scoped to this site's configured path and server.
 *
 * The cookie path is '/<site path>/' when 'site'/'path' is set and is not
 * '/', otherwise '/'. The secure flag is set only when 'site'/'ssl' is
 * 'always'.
 *
 * @param string $key        cookie name
 * @param string $value      cookie value
 * @param int    $expiration expiry timestamp passed to setcookie()
 *                           (default 0)
 *
 * @return bool result of setcookie()
 */
function common_set_cookie($key, $value, $expiration=0)
{
    $path = common_config('site', 'path');
    $server = common_config('site', 'server');

    if ($path && ($path != '/')) {
        $cookiepath = '/' . $path . '/';
    } else {
        $cookiepath = '/';
    }

    return setcookie($key,
                     $value,
                     $expiration,
                     $cookiepath,
                     $server,
                     common_config('site', 'ssl')=='always');
}

// Name of the "remember me" cookie.
define('REMEMBERME', 'rememberme');
// Lifetime added to time() when the "remember me" cookie is issued.
define('REMEMBERME_EXPIRY', 30 * 24 * 60 * 60); // 30 days
362

363 364
/**
 * Issue a "remember me" cookie for a user.
 *
 * Stores a new Remember_me row holding a random code for the user and
 * sends the '<user id>:<code>' pair as the REMEMBERME cookie, expiring
 * REMEMBERME_EXPIRY seconds from now.
 *
 * @param User $user user to remember (optional; defaults to
 *                   common_current_user())
 *
 * @return bool true on success; false when there is no user or the
 *              insert failed
 */
function common_rememberme($user=null)
{
    if (!$user) {
        $user = common_current_user();
        if (!$user) {
            return false;
        }
    }

    $rm = new Remember_me();

    $rm->code = common_random_hexstr(16);
    $rm->user_id = $user->id;

    // Wrap the insert in some good ol' fashioned transaction code

    $rm->query('BEGIN');

    $result = $rm->insert();

    if (!$result) {
        common_log_db_error($rm, 'INSERT', __FILE__);
        $rm->query('ROLLBACK');
        return false;
    }

    $rm->query('COMMIT');

    $cookieval = $rm->user_id . ':' . $rm->code;

    // NOTE(review): this writes the login token itself to the log;
    // consider whether that is acceptable for the deployment.
    common_log(LOG_INFO, 'adding rememberme cookie "' . $cookieval . '" for ' . $user->nickname);

    common_set_cookie(REMEMBERME, $cookieval, time() + REMEMBERME_EXPIRY);

    return true;
}

400 401
/**
 * Log a user in from the REMEMBERME cookie, if it is valid.
 *
 * The cookie holds '<user id>:<code>'. The code must exist as a
 * Remember_me row belonging to that user id, and the user must exist.
 * On success the used row is deleted, the user is set as current, the
 * login is marked as not "real", and a fresh cookie is issued. On any
 * failure the cookie is cleared with common_forgetme().
 *
 * @return mixed the User on success, null otherwise
 */
function common_remembered_user()
{
    $packed = isset($_COOKIE[REMEMBERME]) ? $_COOKIE[REMEMBERME] : null;

    if (!$packed) {
        return null;
    }

    if (!is_string($packed)) {
        // A cookie sent as "rememberme[]=..." arrives as an array.
        common_log(LOG_WARNING, 'Malformed rememberme cookie: ' . gettype($packed));
        common_forgetme();
        return null;
    }

    // Pad so that a value without ':' yields a null code rather than an
    // undefined offset; any parts beyond the second are ignored.
    list($id, $code) = array_pad(explode(':', $packed), 2, null);

    if (!$id || !$code) {
        common_log(LOG_WARNING, 'Malformed rememberme cookie: ' . $packed);
        common_forgetme();
        return null;
    }

    $rm = Remember_me::getKV('code', $code);

    if (!$rm) {
        common_log(LOG_WARNING, 'No such remember code: ' . $code);
        common_forgetme();
        return null;
    }

    if ($rm->user_id != $id) {
        common_log(LOG_WARNING, 'Rememberme code for wrong user: ' . $rm->user_id . ' != ' . $id);
        common_forgetme();
        return null;
    }

    $user = User::getKV('id', $rm->user_id);

    if (!$user instanceof User) {
        common_log(LOG_WARNING, 'No such user for rememberme: ' . $rm->user_id);
        common_forgetme();
        return null;
    }

    // successful! The code is single-use, so remove it.
    $result = $rm->delete();

    if (!$result) {
        common_log_db_error($rm, 'DELETE', __FILE__);
        common_log(LOG_WARNING, 'Could not delete rememberme: ' . $code);
        common_forgetme();
        return null;
    }

    common_log(LOG_INFO, 'logging in ' . $user->nickname . ' using rememberme code ' . $rm->code);

    common_set_user($user);
    common_real_login(false);

    // We issue a new cookie, so they can log in
    // automatically again after this session

    common_rememberme($user);

    return $user;
}

463 464 465
/**
 * Clear the REMEMBERME cookie by setting it to an empty value.
 *
 * NOTE(review): the earlier comment here said "must be called with a valid
 * user!", but this function takes no user and does not look one up.
 *
 * @return void
 */
function common_forgetme()
{
    common_set_cookie(REMEMBERME, '', 0);
}

471 472 473
/**
 * Who is the current user?
 *
 * The answer is cached in the global $_cur: false means "not looked up
 * yet". On the first call the session's 'userid' is tried; if that does
 * not yield a User, the REMEMBERME cookie is tried through
 * common_remembered_user().
 *
 * @return mixed the current User, or null when there is none or the
 *               configuration is not loaded
 */
function common_current_user()
{
    global $_cur;

    if (!_have_config()) {
        return null;
    }

    if ($_cur === false) {

        // Only touch the session when the request carries a session id or
        // a session with a user id is already present.
        if (isset($_COOKIE[session_name()]) || isset($_GET[session_name()])
            || (isset($_SESSION['userid']) && $_SESSION['userid'])) {
            common_ensure_session();
            $id = isset($_SESSION['userid']) ? $_SESSION['userid'] : false;
            if ($id) {
                $user = User::getKV('id', $id);
                if ($user instanceof User) {
                    $_cur = $user;
                    return $_cur;
                }
            }
        }

        // that didn't work; try to remember; will init $_cur to null on failure
        $_cur = common_remembered_user();

        if ($_cur) {
            // XXX: Is this necessary?
            $_SESSION['userid'] = $_cur->id;
        }
    }

    return $_cur;
}

509 510 511 512 513
/**
 * Logins that are 'remembered' aren't 'real' -- they're subject to
 * cookie-stealing. So, we don't let them do certain things. New reg,
 * OpenID, and password logins _are_ real.
 *
 * Records the flag in the session as 'real_login', starting a session
 * first if needed.
 *
 * @param bool $real whether the current login is a real one (default true)
 *
 * @return void
 */
function common_real_login($real=true)
{
    common_ensure_session();
    $_SESSION['real_login'] = $real;
}

520 521
/**
 * Is someone logged in, and was the login marked as a real one?
 *
 * @return bool true when a user is logged in and the session's
 *              'real_login' flag is set and truthy
 */
function common_is_real_login()
{
    // !empty() gives the same truthiness as reading the key directly, but
    // does not raise a notice when the flag was never set.
    return common_logged_in() && !empty($_SESSION['real_login']);
}

525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542 543 544 545 546 547
/**
 * Produce a value for HTTP caching (ETags and the like) that reflects who
 * is using the session. Logging in or out, switching account, or renaming
 * the current user all yield a different value.
 *
 * This should not be considered secure information.
 *
 * @param User $user (optional; uses common_current_user() if left out)
 * @return mixed crc32 of "<id>:<nickname>" for a user, or the string '0'
 *               when there is no user
 */
function common_user_cache_hash($user=false)
{
    $subject = ($user === false) ? common_current_user() : $user;

    if (!$subject) {
        return '0';
    }

    return crc32($subject->id . ':' . $subject->nickname);
}

548 549 550 551 552
/**
 * get canonical version of nickname for comparison
 *
 * Thin wrapper around Nickname::normalize().
 *
 * @param string $nickname
 * @return string
 *
 * @throws NicknameException on invalid input
 * @deprecated call Nickname::normalize() directly.
 */
function common_canonical_nickname($nickname)
{
    return Nickname::normalize($nickname);
}

562 563 564 565 566 567 568 569 570
/**
 * get canonical version of email for comparison
 *
 * Currently a placeholder: the address is returned unchanged.
 *
 * @fixme actually normalize
 * @fixme reject invalid input
 *
 * @param string $email
 * @return string the address exactly as given
 */
function common_canonical_email($email)
{
    // XXX: canonicalize UTF-8
    // XXX: lcase the domain part
    return $email;
}

578 579 580 581
/**
 * Filter HTML through htmLawed.
 *
 * Uses htmLawed's 'safe' mode, denies the id, style and on* attributes,
 * and additionally removes every element whose entry in the 'htmlfilter'
 * configuration is exactly true. Unicode formatting/direction codes are
 * stripped before filtering.
 *
 * @param string $html HTML to filter
 *
 * @return string output of htmLawed()
 */
function common_purify($html)
{
    require_once INSTALLDIR.'/extlib/htmLawed/htmLawed.php';

    $config = array('safe' => 1,    // means that elements=* means elements=*-applet-embed-iframe-object-script or so
                    'elements' => '*',
                    'deny_attribute' => 'id,style,on*');

    // Remove more elements than what the 'safe' filter gives (elements must be '*' before this)
    // http://www.bioinformatics.org/phplabware/internal_utilities/htmLawed/htmLawed_README.htm#s3.6
    foreach (common_config('htmlfilter') as $tag=>$filter) {
        if ($filter === true) {
            $config['elements'] .= "-{$tag}";
        }
    }

    $html = common_remove_unicode_formatting($html);

    return htmLawed($html, $config);
}

/**
 * Strip Unicode text formatting/direction codes (U+200B-U+200F and
 * U+202A-U+202E). These are pretty dangerous for the visualisation of
 * text and can be used for mischief.
 *
 * @param string $text
 *
 * @return mixed result of preg_replace() on $text
 */
function common_remove_unicode_formatting($text)
{
    $formattingCodes = '/[\\x{200b}-\\x{200f}\\x{202a}-\\x{202e}]/u';
    $stripped = preg_replace($formattingCodes, '', $text);

    return $stripped;
}

606 607 608
/**
 * Render notice text to HTML: common_render_text() first, then
 * common_linkify_mentions() on its output.
 *
 * @param string    $text   notice text
 * @param Profile   $author the Profile that is composing the current notice
 * @param Notice    $parent the Notice this is sent in reply to, if any
 * @return string rendered HTML
 */
function common_render_content($text, Profile $author, Notice $parent=null)
{
    $text = common_render_text($text);
    $text = common_linkify_mentions($text, $author, $parent);
    return $text;
}

621 622 623 624 625 626
/**
 * Finds @-mentions within the partially-rendered text section and
 * turns them into live links.
 *
 * Should generally not be called except from common_render_content().
 *
 * @param string    $text   partially-rendered HTML
 * @param Profile   $author the Profile that is composing the current notice
 * @param Notice    $parent the Notice this is sent in reply to, if any
 * @return string partially-rendered HTML
 */
function common_linkify_mentions($text, Profile $author, Notice $parent=null)
{
    $mentions = common_find_mentions($text, $author, $parent);

    // We need to go through in reverse order by position,
    // so our positions stay valid despite our fudging with the
    // string!

    // Keyed by position, so a later mention at the same position
    // replaces an earlier one.
    $points = array();

    foreach ($mentions as $mention) {
        $points[$mention['position']] = $mention;
    }

    krsort($points);

    foreach ($points as $position => $mention) {

        $linkText = common_linkify_mention($mention);

        // NOTE(review): substr_replace() counts bytes, while the visible
        // producers of 'length' use mb_strlen(); presumably the two only
        // agree for single-byte text. Confirm for multibyte matches.
        $text = substr_replace($text, $linkText, $position, $mention['length']);
    }

    return $text;
}

659
/**
 * Build the HTML link for a single mention.
 *
 * Unless a 'StartLinkifyMention' handler takes over (by returning a falsy
 * value), an <a> element is built with the mention's url as href, class
 * 'h-card <type>', an optional title, and the mention text as content;
 * 'EndLinkifyMention' handlers may then alter the output.
 *
 * @param array $mention mention data with at least 'url', 'type' and
 *                       'text'; 'title' is optional
 *
 * @return mixed the link markup, or whatever a handler left in the output
 *               (null if nothing was produced)
 */
function common_linkify_mention(array $mention)
{
    $output = null;

    if (Event::handle('StartLinkifyMention', array($mention, &$output))) {

        $xs = new XMLStringer(false);

        $attrs = array('href' => $mention['url'],
                       'class' => 'h-card '.$mention['type']);

        if (!empty($mention['title'])) {
            $attrs['title'] = $mention['title'];
        }

        $xs->element('a', $attrs, $mention['text']);

        $output = $xs->getString();

        Event::handle('EndLinkifyMention', array($mention, &$output));
    }

    return $output;
}

684
/**
 * Collect the objects a text addresses, keyed by URI.
 *
 * Every profile mentioned in the text (per common_find_mentions()) is
 * added with its object type; the author of the parent notice, if any, is
 * added as a person.
 *
 * @param string  $text
 * @param Profile $sender the Profile that is sending the text
 * @param Notice  $parent the Notice this text is in reply to, if any
 *
 * @return array URI => object type
 */
function common_get_attentions($text, Profile $sender, Notice $parent=null)
{
    $mentions = common_find_mentions($text, $sender, $parent);
    $atts = array();

    foreach ($mentions as $mention) {
        foreach ($mention['mentioned'] as $mentioned) {
            $atts[$mentioned->getUri()] = $mentioned->getObjectType();
        }
    }

    if ($parent instanceof Notice) {
        $parentAuthor = $parent->getProfile();
        // afaik groups can't be authors
        $atts[$parentAuthor->getUri()] = ActivityObject::PERSON;
    }

    return $atts;
}

701
/**
 * Find @-mentions in the given text, using the given notice object as context.
 * References will be resolved with common_relative_profile() against the user
 * who posted the notice.
 *
 * Three kinds of reference are collected: @nickname (type 'mention'),
 * @#tag for the sender's non-private profile lists (type 'list'), and
 * !group for groups the sender is a member of (type 'group').
 *
 * Note the return data format is internal, to be used for building links and
 * such. Should not be used directly; rather, call common_linkify_mentions().
 *
 * @param string    $text
 * @param Profile   $sender the Profile that is sending the current text
 * @param Notice    $parent the Notice this text is in reply to, if any
 *
 * @return array list of arrays with keys 'mentioned', 'type', 'text',
 *               'position', 'length', 'url' and (except for lists) 'title'
 *
 * @access private
 */
function common_find_mentions($text, Profile $sender, Notice $parent=null)
{
    $mentions = array();

    if (Event::handle('StartFindMentions', array($sender, $text, &$mentions))) {
        // Get the context of the original notice, if any
        $origMentions = array();

        // Does it have a parent notice for context?
        if ($parent instanceof Notice) {
            $ids = $parent->getReplies();   // replied-to _profile ids_

            foreach ($ids as $id) {
                try {
                    $repliedTo = Profile::getByID($id);
                    $origMentions[$repliedTo->getNickname()] = $repliedTo;
                } catch (NoResultException $e) {
                    // continue foreach
                }
            }
        }

        $matches = common_find_mentions_raw($text);

        foreach ($matches as $match) {
            try {
                $nickname = Nickname::normalize($match[0]);
            } catch (NicknameException $e) {
                // Bogus match? Drop it.
                continue;
            }

            // Try to get a profile for this nickname.
            // Start with conversation context, then go to
            // sender context.

            if ($parent instanceof Notice && $parent->getProfile()->getNickname() === $nickname) {
                $mentioned = $parent->getProfile();
            } else if (!empty($origMentions) &&
                       array_key_exists($nickname, $origMentions)) {
                $mentioned = $origMentions[$nickname];
            } else {
                // sets to null if no match
                $mentioned = common_relative_profile($sender, $nickname);
            }

            if ($mentioned instanceof Profile) {
                try {
                    $url = $mentioned->getUrl();
                } catch (InvalidUrlException $e) {
                    $url = common_local_url('userbyid', array('id' => $mentioned->getID()));
                }

                $mentions[] = array('mentioned' => array($mentioned),
                                    'type'      => 'mention',
                                    'text'      => $match[0],
                                    'position'  => $match[1],
                                    'length'    => mb_strlen($match[0]),
                                    'title'     => $mentioned->getFullname(),
                                    'url'       => $url);
            }
        }

        // @#tag => mention of all subscriptions tagged 'tag'

        preg_match_all('/(?:^|[\s\.\,\:\;]+)@#([\pL\pN_\-\.]{1,64})/',
                       $text, $hmatches, PREG_OFFSET_CAPTURE);
        foreach ($hmatches[1] as $hmatch) {
            $tag = common_canonical_tag($hmatch[0]);
            $plist = Profile_list::getByTaggerAndTag($sender->getID(), $tag);
            if (!$plist instanceof Profile_list || $plist->private) {
                continue;
            }
            $tagged = $sender->getTaggedSubscribers($tag);

            $url = common_local_url('showprofiletag',
                                    array('nickname' => $sender->getNickname(),
                                          'tag' => $tag));

            $mentions[] = array('mentioned' => $tagged,
                                'type'      => 'list',
                                'text'      => $hmatch[0],
                                'position'  => $hmatch[1],
                                'length'    => mb_strlen($hmatch[0]),
                                'url'       => $url);
        }

        // !group => mention of a group the sender belongs to

        preg_match_all('/(?:^|[\s\.\,\:\;]+)!(' . Nickname::DISPLAY_FMT . ')/',
                       $text, $hmatches, PREG_OFFSET_CAPTURE);
        foreach ($hmatches[1] as $hmatch) {
            try {
                $nickname = Nickname::normalize($hmatch[0]);
            } catch (NicknameException $e) {
                // Bogus match? Drop it, as for @-mentions above, rather
                // than letting one bad group name abort the whole scan.
                continue;
            }
            $group = User_group::getForNickname($nickname, $sender);

            if (!$group instanceof User_group || !$sender->isMember($group)) {
                continue;
            }

            $profile = $group->getProfile();

            $mentions[] = array('mentioned' => array($profile),
                                'type'      => 'group',
                                'text'      => $hmatch[0],
                                'position'  => $hmatch[1],
                                'length'    => mb_strlen($hmatch[0]),
                                'url'       => $group->permalink(),
                                'title'     => $group->getFancyName());
        }

        Event::handle('EndFindMentions', array($sender, $text, &$mentions));
    }

    return $mentions;
}

835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859
/**
 * Runs the regular expressions that locate @-mentions in text.
 * Not meant to be called directly; common_find_mentions() is the consumer.
 *
 * Two forms are recognised: a leading "T nickname " and "@nickname"
 * at the start of the text or after whitespace.
 *
 * @param string $text
 * @return array of PCRE match arrays (captured nickname and its offset),
 *               "T" matches first, then "@" matches
 */
function common_find_mentions_raw($text)
{
    $nick = Nickname::DISPLAY_FMT;

    $patterns = array('/^T (' . $nick . ') /',
                      '/(?:^|\s+)@(' . $nick . ')\b/');

    $matches = array();

    foreach ($patterns as $pattern) {
        $found = array();
        preg_match_all($pattern, $text, $found, PREG_OFFSET_CAPTURE);
        // Group 1 holds the nickname captures with their offsets.
        $matches = array_merge($matches, $found[1]);
    }

    return $matches;
}

860 861
/**
 * Render plain notice text to HTML.
 *
 * Strips Unicode formatting codes, HTML-escapes the text and converts
 * newlines to <br>, removes a range of control characters, passes URLs to
 * common_linkify() and turns #hashtags into tag links.
 *
 * @param string $text plain text
 *
 * @return string partially rendered HTML
 */
function common_render_text($text)
{
    $text = common_remove_unicode_formatting($text);
    $text = nl2br(htmlspecialchars($text));

    $text = preg_replace('/[\x{0}-\x{8}\x{b}-\x{c}\x{e}-\x{19}]/', '', $text);
    $text = common_replace_urls_callback($text, 'common_linkify');
    // The leading delimiter (group 1) is kept; only the tag name (group 2)
    // is replaced by its link.
    $text = preg_replace_callback('/(^|\&quot\;|\'|\(|\[|\{|\s+)#([\pL\pN_\-\.]{1,64})/u',
                function ($m) { return "{$m[1]}#".common_tag_link($m[2]); }, $text);
    // XXX: machine tags
    return $text;
}

873 874 875 876 877 878 879 880
/**
 * Find links in the given text and pass them to the given callback function.
 *
 * The text is scanned with a single large regular expression assembled below
 * from named pieces. Every match is handed to callback_helper() together with
 * $callback and $arg, and whatever that returns replaces the match.
 *
 * @param string $text
 * @param callable $callback function($url, $arg): returns replacement text
 * @param mixed $arg optional argument will be passed on to the callback
 * @return string|null result of preg_replace_callback() on $text
 */
function common_replace_urls_callback($text, $callback, $arg = null) {
    // A link starts at the beginning of the text or after whitespace,
    // brackets, quotes or a semicolon, and may not itself begin with @, ! or #.
    $boundary = '(?:^|[\s\<\>\(\)\[\]\{\}\\\'\\\";]+)(?![\@\!\#])';

    // Known protocols: "scheme://" or "scheme:"
    $scheme =
        '(?:'.
            '(?:(?:https?|ftps?|mms|rtsp|gopher|news|nntp|telnet|wais|file|prospero|webcal|ircs?)://)'.
            '|'.
            '(?:(?:mailto|aim|tel|xmpp):)'.
        ')';

    // Optional user:pass@
    $credentials = '(?:[\pN\pL\-\_\+\%\~]+(?::[\pN\pL\-\_\+\%\~]+)?\@)?';

    // Host after a known protocol: [dns] or dns
    $host =
        '(?:'.
            '(?:'.
                '\[[\pN\pL\-\_\:\.]+(?<![\.\:])\]'.
            ')|(?:'.
                '[\pN\pL\-\_\:\.]+(?<![\.\:])'.
            ')'.
        ')';

    $withProtocol = '(?:' . $scheme . $credentials . $host . ')';

    // URLs without domain name
    $magnet = '(?:(?:magnet):)';

    $ipv4 = '(?:(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)\.){3}(?:25[0-5]|2[0-4][0-9]|[01]?[0-9][0-9]?)';

    $ipv6 =
        '(?:'.
            '\[?(?:(?:(?:[0-9A-Fa-f]{1,4}:){7}(?:(?:[0-9A-Fa-f]{1,4})|:))|(?:(?:[0-9A-Fa-f]{1,4}:){6}(?::|(?:(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})(?:\.(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})){3})|(?::[0-9A-Fa-f]{1,4})))|(?:(?:[0-9A-Fa-f]{1,4}:){5}(?:(?::(?:(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})(?:\.(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})){3})?)|(?:(?::[0-9A-Fa-f]{1,4}){1,2})))|(?:(?:[0-9A-Fa-f]{1,4}:){4}(?::[0-9A-Fa-f]{1,4}){0,1}(?:(?::(?:(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})(?:\.(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})){3})?)|(?:(?::[0-9A-Fa-f]{1,4}){1,2})))|(?:(?:[0-9A-Fa-f]{1,4}:){3}(?::[0-9A-Fa-f]{1,4}){0,2}(?:(?::(?:(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})(?:\.(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})){3})?)|(?:(?::[0-9A-Fa-f]{1,4}){1,2})))|(?:(?:[0-9A-Fa-f]{1,4}:){2}(?::[0-9A-Fa-f]{1,4}){0,3}(?:(?::(?:(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})(?:\.(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})){3})?)|(?:(?::[0-9A-Fa-f]{1,4}){1,2})))|(?:(?:[0-9A-Fa-f]{1,4}:)(?::[0-9A-Fa-f]{1,4}){0,4}(?:(?::(?:(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})(?:\.(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})){3})?)|(?:(?::[0-9A-Fa-f]{1,4}){1,2})))|(?::(?::[0-9A-Fa-f]{1,4}){0,5}(?:(?::(?:(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})(?:\.(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})){3})?)|(?:(?::[0-9A-Fa-f]{1,4}){1,2})))|(?:(?:(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})(?:\.(?:25[0-5]|2[0-4]\d|[01]?\d{1,2})){3})))\]?(?<!:)'.
        ')';

    // Bare domain names (no protocol) are only recognised when the
    // 'linkify'/'bare_domains' setting is on; otherwise nothing is added.
    $bareDomain = '';
    if (common_config('linkify', 'bare_domains')) {
        $bareDomain =
            '|(?:'. //DNS
                '(?:[\pN\pL\-\_\+\%\~]+(?:\:[\pN\pL\-\_\+\%\~]+)?\@)?'. //user:pass@
                '[\pN\pL\-\_]+(?:\.[\pN\pL\-\_]+)*\.'.
                //tld list from http://data.iana.org/TLD/tlds-alpha-by-domain.txt, also added local, loc, and onion
                '(?:AC|AD|AE|AERO|AF|AG|AI|AL|AM|AN|AO|AQ|AR|ARPA|AS|ASIA|AT|AU|AW|AX|AZ|BA|BB|BD|BE|BF|BG|BH|BI|BIZ|BJ|BM|BN|BO|BR|BS|BT|BV|BW|BY|BZ|CA|CAT|CC|CD|CF|CG|CH|CI|CK|CL|CM|CN|CO|COM|COOP|CR|CU|CV|CX|CY|CZ|DE|DJ|DK|DM|DO|DZ|EC|EDU|EE|EG|ER|ES|ET|EU|FI|FJ|FK|FM|FO|FR|GA|GB|GD|GE|GF|GG|GH|GI|GL|GM|GN|GOV|GP|GQ|GR|GS|GT|GU|GW|GY|HK|HM|HN|HR|HT|HU|ID|IE|IL|IM|IN|INFO|INT|IO|IQ|IR|IS|IT|JE|JM|JO|JOBS|JP|KE|KG|KH|KI|KM|KN|KP|KR|KW|KY|KZ|LA|LB|LC|LI|LK|LR|LS|LT|LU|LV|LY|MA|MC|MD|ME|MG|MH|MIL|MK|ML|MM|MN|MO|MOBI|MP|MQ|MR|MS|MT|MU|MUSEUM|MV|MW|MX|MY|MZ|NA|NAME|NC|NE|NET|NF|NG|NI|NL|NO|NP|NR|NU|NZ|OM|ORG|PA|PE|PF|PG|PH|PK|PL|PM|PN|PR|PRO|PS|PT|PW|PY|QA|RE|RO|RS|RU|RW|SA|SB|SC|SD|SE|SG|SH|SI|SJ|SK|SL|SM|SN|SO|SR|ST|SU|SV|SY|SZ|TC|TD|TEL|TF|TG|TH|TJ|TK|TL|TM|TN|TO|TP|TR|TRAVEL|TT|TV|TW|TZ|UA|UG|UK|US|UY|UZ|VA|VC|VE|VG|VI|VN|VU|WF|WS|XN--0ZWM56D|测试|XN--11B5BS3A9AJ6G|परीक्षा|XN--80AKHBYKNJ4F|испытание|XN--9T4B11YI5A|테스트|XN--DEBA0AD|טעסט|XN--G6W251D|測試|XN--HGBK6AJ7F53BBA|آزمایشی|XN--HLCJ6AYA9ESC7A|பரிட்சை|XN--JXALPDLP|δοκιμή|XN--KGBECHTV|إختبار|XN--ZCKZAH|テスト|YE|YT|YU|ZA|ZM|ZONE|ZW|local|loc|onion)'.
            ')(?![\pN\pL\-\_])';
    }

    // What the link points at: any one of the alternatives above.
    $target = '(?:' . $withProtocol . '|' . $magnet . '|' . $ipv4 . '|' . $ipv6 . $bareDomain . ')';

    // Everything after the host; the link may not end in ?, ., , or #.
    $tail =
        '(?:'.
            '(?:\:\d+)?'. //:port
            '(?:/[\pN\pL$\,\!\(\)\.\:\-\_\+\/\=\&\;\%\~\*\$\+\'@]*)?'. // /path
            '(?:\?[\pN\pL\$\,\!\(\)\.\:\-\_\+\/\=\&\;\%\~\*\$\+\'@\/]*)?'. // ?query string
            '(?:\#[\pN\pL$\,\!\(\)\.\:\-\_\+\/\=\&\;\%\~\*\$\+\'\@/\?\#]*)?'. // #fragment
        ')(?<![\?\.\,\#\,])';

    // Capture group 1 is the link itself, without the leading boundary.
    $regex = '#' . $boundary . '(' . $target . $tail . ')' . '#ixu';

    $handler = curry('callback_helper', $callback, $arg);

    return preg_replace_callback($regex, $handler, $text);
}
927

928 929 930 931 932 933 934 935
/**
 * Intermediate callback for common_replace_urls_callback(), helps resolve
 * some ambiguous link forms before passing on to the final callback.
 *
 * Trailing closing brackets that have no matching opening bracket inside the
 * URL, and trailing '.', '?', ',' or '#' characters, are treated as
 * surrounding punctuation: they are removed from the URL given to $callback
 * and kept verbatim in the returned text.
 *
 * @param array $matches regex match; [0] is the whole match, [1] the URL in it
 * @param callable $callback called as $callback($url, $arg), returns the
 *                           replacement text for the URL
 * @param mixed $arg optional argument to pass on as second param to callback
 * @return string the whole match with the trimmed URL swapped for the
 *                callback's result
 *
 * @access private
 */
function callback_helper($matches, $callback, $arg=null) {
    $whole = $matches[0];
    $url = $matches[1];

    // Byte offsets of the URL inside the whole match; $end shrinks as
    // trailing punctuation is peeled off the URL.
    $start = strpos($whole, $url);
    $end = $start + strlen($url);

    // closing bracket => its opening counterpart
    $closerToOpener = array(
        ')' => '(',
        ']' => '[',
        '}' => '{',
        '>' => '<',
    );
    $trailingJunk = array('.', '?', ',', '#');

    // Keep peeling until a full pass leaves the URL unchanged.
    while (true) {
        $before = $url;

        foreach ($closerToOpener as $closer => $opener) {
            if (substr($url, -1) != $closer) {
                continue;
            }
            // Only drop the closer when it is unbalanced within the URL.
            if (substr_count($url, $opener) < substr_count($url, $closer)) {
                $url = substr($url, 0, -1);
                $end--;
            }
        }

        if (in_array(substr($url, -1), $trailingJunk)) {
            $url = substr($url, 0, -1);
            $end--;
        }

        if ($before == $url) {
            break;
        }
    }

    $replacement = call_user_func_array($callback, array($url, $arg));

    return substr($whole, 0, $start) . $replacement . substr($whole, $end);
}
985

986
require_once INSTALLDIR . "/lib/curry.php";
987 988

function common_linkify($url) {
Evan Prodromou's avatar
Evan Prodromou committed
989 990 991
    // It comes in special'd, so we unspecial it before passing to the stringifying
    // functions
    $url = htmlspecialchars_decode($url);
992

993 994 995 996 997
    if (strpos($url, '@') !== false && strpos($url, ':') === false && Validate::email($url)) {
        //url is an email address without the mailto: protocol
        $canon = "mailto:$url";
        $longurl = "mailto:$url";
    } else {
998
        $canon = File_redirection::_canonUrl($url);
999
        $longurl_data = File_redirection::where($canon, common_config('attachments', 'process_links'));
hannes's avatar
hannes committed
1000 1001 1002 1003 1004 1005 1006
        
        if(isset($longurl_data->redir_url)) {
			$longurl = $longurl_data->redir_url;
        } else {
            // e.g. local files
	        $longurl = $longurl_data->url;
        }
1007
    }
hannes's avatar
hannes committed
1008 1009
    
    $attrs = array('href' => $longurl, 'title' => $longurl);
1010

1011 1012 1013 1014
    $is_attachment = false;
    $attachment_id = null;
    $has_thumb = false;

1015
    // Check to see whether this is a known "attachment" URL.