-
Notifications
You must be signed in to change notification settings - Fork 676
/
TestOfPost.php
192 lines (165 loc) · 8.67 KB
/
TestOfPost.php
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
<?php
/**
*
* ThinkUp/tests/TestOfPost.php
*
* Copyright (c) 2009-2013 Gina Trapani
*
* LICENSE:
*
* This file is part of ThinkUp (http://thinkup.com).
*
* ThinkUp is free software: you can redistribute it and/or modify it under the terms of the GNU General Public
* License as published by the Free Software Foundation, either version 2 of the License, or (at your option) any
* later version.
*
* ThinkUp is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied
* warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
* details.
*
* You should have received a copy of the GNU General Public License along with ThinkUp. If not, see
* <http://www.gnu.org/licenses/>.
*
* Test of Post class
*
* @license http://www.gnu.org/licenses/gpl.html
* @copyright 2009-2013 Gina Trapani
* @author Gina Trapani <ginatrapani[at]gmail[dot]com>
*/
require_once dirname(__FILE__).'/init.tests.php';
require_once THINKUP_WEBAPP_PATH.'_lib/extlib/simpletest/autorun.php';
require_once THINKUP_WEBAPP_PATH.'config.inc.php';
class TestOfPost extends ThinkUpBasicUnitTestCase {
public function testExtractURLs() {
$test_patterns = array (
"Introducing the ThinkUp developers mailing list http://bit.ly/gXpdUZ"=> array ('http://bit.ly/gXpdUZ'),
"http://j.mp/g2F037 good advice (Mad Men-illustrated) for women in tech"=> array ('http://j.mp/g2F037') ,
"blah blah blah http:///badurl.com d http://bit.ly and http://example.org"=> array ('http://bit.ly',
'http://example.org'),
"blah blah blah http:///badurl.com d HTTP://yo.com/exi.xml?hi=yes and http://example.org/blah/yoiadsf/934324/"
=> array ('HTTP://yo.com/exi.xml?hi=yes', 'http://example.org/blah/yoiadsf/934324/'),
"I bought the book at http://amazon.com. You should read it, too"=> array ('http://amazon.com'),
"So, Who's on first? check “http://culturalwormhole.blogspot.com/†for more."=>
array ('http://culturalwormhole.blogspot.com/'),
"We know all about that (http://friendoflou.com), but we're not impressed." =>
array ('http://friendoflou.com'),
"A more terse, yet still friendly introduction notme.com norme.com/ bit.ly/gXpdUZ and blah yo.com/exi".
".xml?hi=yes blah" => array ('http://bit.ly/gXpdUZ', 'http://yo.com/exi.xml?hi=yes'),
"tersely www.google.com notme.google.com www.nytimes.com"=> array ('http://www.google.com',
'http://www.nytimes.com'),
"would you believe this url? http://foo.com/more_(than)_one_(parens) " =>
array('http://foo.com/more_(than)_one_(parens)'),
"detects embedding <http://foo.com/blah_blah/> nicely <tag>http://example.com</tag>"
=> array('http://foo.com/blah_blah/', 'http://example.com'),
'"RT @someone doesnt screw up RTs with quotes that bookend a link like http://example.com"'
=> array('http://example.com'),
"This here's a t.co link enclosed by a curly brace http://t.co/2JVSpi5Ó"=> array ('http://t.co/2JVSpi5'));
foreach ($test_patterns as $test_text=>$expected_urls) {
$urls = Post::extractURLs($test_text);
$this->assertIdentical($expected_urls, $urls, $test_text.' %s');
$this->assertTrue(array_reduce(array_map('Utils::validateURL', $urls), 'TestOfPost::isAllTrue', true));
}
}
public static function isAllTrue($a, $b) {
return $a && $b;
}
public function testExtractMentions() {
$test_str = '@samwhoo woot yay win cake';
$mentions = Post::extractMentions($test_str);
$actual_mentions = array('@samwhoo');
$this->assertIdentical($mentions, $actual_mentions);
$test_str = '@samwhoo @anildash woot yay win cake';
$mentions = Post::extractMentions($test_str);
$actual_mentions = array('@samwhoo', '@anildash');
$this->assertIdentical($mentions, $actual_mentions);
$test_str = '@samwhoo @anildash @ginatrapani woot yay win cake';
$mentions = Post::extractMentions($test_str);
$actual_mentions = array('@samwhoo', '@anildash', '@ginatrapani');
$this->assertIdentical($mentions, $actual_mentions);
$test_str = 'woot yay win cake #game';
$mentions = Post::extractMentions($test_str);
$actual_mentions = array();
$this->assertIdentical($mentions, $actual_mentions);
$test_str = "@sam'whoo woot yay win cake";
$mentions = Post::extractMentions($test_str);
$actual_mentions = array('@sam');
$this->assertIdentical($mentions, $actual_mentions);
$test_str = "@sam#whoo woot yay win cake";
$mentions = Post::extractMentions($test_str);
$actual_mentions = array('@sam');
$this->assertIdentical($mentions, $actual_mentions);
$test_str = "@sam/whoo woot yay win cake";
$mentions = Post::extractMentions($test_str);
$actual_mentions = array('@sam');
$this->assertIdentical($mentions, $actual_mentions);
$test_str = "@sam.whoo woot yay win cake";
$mentions = Post::extractMentions($test_str);
$actual_mentions = array('@sam');
$this->assertIdentical($mentions, $actual_mentions);
$test_str = "@sam-whoo woot yay win cake";
$mentions = Post::extractMentions($test_str);
$actual_mentions = array('@sam');
$this->assertIdentical($mentions, $actual_mentions);
// Tests below come from twitter-text-conformance
$test_str = "@1234 woot yay win cake";
$mentions = Post::extractMentions($test_str);
$actual_mentions = array('@1234');
$this->assertIdentical($mentions, $actual_mentions);
$test_str = "ã®@usernameã«åˆ°ç€ã‚’å¾…ã£ã¦ã„ã‚‹";
$mentions = Post::extractMentions($test_str);
$actual_mentions = array('@username');
$this->assertIdentical($mentions, $actual_mentions, "Extract mention in the middle of a Japanese tweet");
$test_str = "Current Status: @_@ (cc: @username)";
$mentions = Post::extractMentions($test_str);
$actual_mentions = array('@username');
$this->assertIdentical($mentions, $actual_mentions, "DO NOT extract username ending in @");
$test_str = "@aliceìnheiro something something";
$mentions = Post::extractMentions($test_str);
$actual_mentions = array();
$this->assertIdentical($mentions, $actual_mentions, "DO NOT extract username followed by accented latin
characters");
$test_str = "@username email me @test@example.com";
$mentions = Post::extractMentions($test_str);
$actual_mentions = array('@username');
$this->assertIdentical($mentions, $actual_mentions, "Extract lone metion but not @user@user (too close to an
email)");
}
public function testExtractHashtags() {
$test_str = '@samwhoo woot yay win #cake';
$hashtags = Post::extractHashtags($test_str);
$actual_hashtags = array('#cake');
$this->assertIdentical($hashtags, $actual_hashtags);
$test_str = '@samwhoo woot yay #win #cake';
$hashtags = Post::extractHashtags($test_str);
$actual_hashtags = array('#win', '#cake');
$this->assertIdentical($hashtags, $actual_hashtags);
$test_str = '@samwhoo woot #yay #win #cake';
$hashtags = Post::extractHashtags($test_str);
$actual_hashtags = array('#yay', '#win', '#cake');
$this->assertIdentical($hashtags, $actual_hashtags);
$test_str = '@samwhoo woot yay win cake';
$hashtags = Post::extractHashtags($test_str);
$actual_hashtags = array();
$this->assertIdentical($hashtags, $actual_hashtags);
$test_str = '@samwhoo woot yay win #ca-ke';
$hashtags = Post::extractHashtags($test_str);
$actual_hashtags = array('#ca');
$this->assertIdentical($hashtags, $actual_hashtags);
$test_str = '@samwhoo woot yay win #ca@ke';
$hashtags = Post::extractHashtags($test_str);
$actual_hashtags = array('#ca');
$this->assertIdentical($hashtags, $actual_hashtags);
$test_str = '@samwhoo woot yay win #ca.ke';
$hashtags = Post::extractHashtags($test_str);
$actual_hashtags = array('#ca');
$this->assertIdentical($hashtags, $actual_hashtags);
$test_str = "@samwhoo woot yay win #ca'ke";
$hashtags = Post::extractHashtags($test_str);
$actual_hashtags = array('#ca');
$this->assertIdentical($hashtags, $actual_hashtags);
$test_str = '@samwhoo woot yay win #ca/ke';
$hashtags = Post::extractHashtags($test_str);
$actual_hashtags = array('#ca');
$this->assertIdentical($hashtags, $actual_hashtags);
}
}