class PorterStemmerInternalsUnitTest in Porter-Stemmer 7
Same name and namespace in other branches
- 6.2 porterstemmer.test \PorterStemmerInternalsUnitTest
Unit tests for Porter Stemmer - Stemming internals.
Hierarchy
- class \DrupalTestCase
- class \DrupalWebTestCase
Expanded class hierarchy of PorterStemmerInternalsUnitTest
File
- ./
porterstemmer.test, line 536 - Tests for the Porter Stemmer module. By Jennifer Hodgdon of Poplar ProductivityWare, www.poplarware.com. Unit tests are based on sample words from http://snowball.tartarus.org/algorithms/english/stemmer.html which are stored in a separate file…
View source
/**
 * Unit tests for Porter Stemmer - Stemming internals.
 *
 * Exercises the minimum-word-length handling of porterstemmer_stem(), the
 * individual algorithm step functions (prestemming, steps 1a, 1b, 1c, 2, 4
 * and 5), the "short word" helper, and the excerpt matching function.
 *
 * Most tests call variable_set('minimum_word_size', ...) followed by
 * porterstemmer_too_short('', TRUE). NOTE(review): the second call presumably
 * makes the stemmer re-read the minimum word size it caches internally;
 * confirm against porterstemmer_too_short() before relying on that.
 */
class PorterStemmerInternalsUnitTest extends DrupalWebTestCase {

  /**
   * Describes this test case to the test runner.
   *
   * @return array
   *   Array with the 'name', 'description' and 'group' of the test case.
   */
  public static function getInfo() {
    return array(
      'name' => t('Stemming internals'),
      'description' => t('Test that various algorithm steps and internal functions are working correctly'),
      'group' => t('Porter Stemmer'),
    );
  }

  /**
   * Enables the porterstemmer module and loads the standard stemmer include.
   */
  public function setUp() {
    parent::setUp('porterstemmer');
    // The step functions under test live in this include file, so load it
    // explicitly before any test method calls them.
    module_load_include('inc', 'porterstemmer', 'includes/standard-stemmer');
  }

  /**
   * Verify that short words are not stemmed, and longer ones are.
   *
   * Uses a minimum word size of 3.
   */
  public function testStemLength3UnitTest() {
    // Words 3 letters or less should not be stemmed if min word length is 3.
    variable_set('minimum_word_size', 3);
    porterstemmer_too_short('', TRUE);

    // Input word => expected stem.
    $words = array(
      'a' => 'a',
      'at' => 'at',
      'say' => 'say',
      'fished' => 'fish',
      'saying' => 'say',
    );
    foreach ($words as $in => $out) {
      $stem = porterstemmer_stem($in);
      $this->assertEqual($out, $stem, "Stemming length 3 test for {$in} gives {$out} (was {$stem})", t('Stemming length'));
    }
  }

  /**
   * Verify that short words are not stemmed, and longer ones are.
   *
   * Uses a minimum word size of 4.
   */
  public function testStemLength4UnitTest() {
    // Words 4 letters or less should not be stemmed if min word length is 4.
    variable_set('minimum_word_size', 4);
    porterstemmer_too_short('', TRUE);

    // Input word => expected stem. Unlike the length-3 test, 'saying' is
    // expected to come back unchanged here.
    $words = array(
      'a' => 'a',
      'at' => 'at',
      'say' => 'say',
      'fished' => 'fish',
      'saying' => 'saying',
    );
    foreach ($words as $in => $out) {
      $stem = porterstemmer_stem($in);
      $this->assertEqual($out, $stem, "Stemming length 4 test for {$in} gives {$out} (was {$stem})", t('Stemming length'));
    }
  }

  /**
   * Tests the function that determines if a word is "short".
   */
  public function testShortWord() {
    // Test "shortness", using examples from algorithm web page,
    // as well as several variations on the word "administ...".
    variable_set('minimum_word_size', 2);
    porterstemmer_too_short('', TRUE);

    // Each case: word, second argument for porterstemmer_short_word()
    // (presumably the R1 position of the word; confirm against the stemmer),
    // and whether the word is expected to be reported as short.
    $cases = array(
      array('administered', 2, FALSE),
      array('administer', 2, FALSE),
      array('admin', 2, FALSE),
      array('bed', 3, TRUE),
      array('shed', 4, TRUE),
      array('shred', 5, TRUE),
      array('bead', 4, FALSE),
      array('beds', 3, FALSE),
      array('bake', 3, FALSE),
      array('bak', 3, TRUE),
    );

    foreach ($cases as $case) {
      list($word, $r1, $expect_short) = $case;
      $is_short = porterstemmer_short_word($word, $r1);
      // The assertion group is the third argument of the assertion itself;
      // it must not be passed to porterstemmer_short_word(), otherwise the
      // results are filed under the default group.
      if ($expect_short) {
        $this->assertTrue($is_short, "{$word} should be a short word", 'Stemmer steps');
      }
      else {
        $this->assertFalse($is_short, "{$word} should not be a short word", 'Stemmer steps');
      }
    }
  }

  /**
   * Test internal steps on the word "administered".
   */
  public function testAdministered() {
    variable_set('minimum_word_size', 2);
    porterstemmer_too_short('', TRUE);

    $r1 = 0;
    $r2 = 0;
    $word = 'administered';
    // The assertions below rely on prestemming filling in $r1 and $r2.
    porterstemmer_prestemming($word, $r1, $r2);

    // Test calculation of R1 and R2.
    $this->assertEqual($r1, 2, "R1 for administered should be 2, was {$r1}", 'Stemmer steps');
    $this->assertEqual($r2, 5, "R2 for administered should be 5, was {$r2}", 'Stemmer steps');

    // Test step 1b of the algorithm. $word is modified in place.
    porterstemmer_step1b($word, $r1);
    $this->assertEqual($word, 'administer', "Step1b should be administer, was {$word}", 'Stemmer steps');

    // Test step 4 of the algorithm, applied to the output of step 1b.
    porterstemmer_step4($word, $r2);
    $this->assertEqual($word, 'administ', "Step4 should be administ, was {$word}", 'Stemmer steps');
  }

  /**
   * Test internal steps on the word "baked".
   */
  public function testBaked() {
    variable_set('minimum_word_size', 2);
    porterstemmer_too_short('', TRUE);

    $r1 = 0;
    $r2 = 0;
    $word = 'baked';
    porterstemmer_prestemming($word, $r1, $r2);

    // Test calculation of R1 and R2.
    $this->assertEqual($r1, 3, "R1 for baked should be 3, was {$r1}", 'Stemmer steps');
    $this->assertEqual($r2, 5, "R2 for baked should be 5, was {$r2}", 'Stemmer steps');

    // Test step 1b of the algorithm.
    porterstemmer_step1b($word, $r1);
    $this->assertEqual($word, 'bake', "Step1b should be bake, was {$word}", 'Stemmer steps');

    // Test step 5 of the algorithm: the final "e" is expected to be kept.
    porterstemmer_step5($word, $r1, $r2);
    $this->assertEqual($word, 'bake', "Step5 should be bake, was {$word}", 'Stemmer steps');
  }

  /**
   * Test internal steps on the word "geology".
   */
  public function testGeology() {
    $r1 = 0;
    $r2 = 0;
    $word = 'geology';

    variable_set('minimum_word_size', 2);
    porterstemmer_too_short('', TRUE);
    porterstemmer_prestemming($word, $r1, $r2);

    // Test calculation of R1 and R2.
    $this->assertEqual($r1, 4, "R1 for geology should be 4, was {$r1}", 'Stemmer steps');
    $this->assertEqual($r2, 6, "R2 for geology should be 6, was {$r2}", 'Stemmer steps');

    // Test step 1c of the algorithm.
    porterstemmer_step1c($word);
    $this->assertEqual($word, 'geologi', "Step1c should be geologi, was {$word}", 'Stemmer steps');

    // Test step 2 of the algorithm, applied to the output of step 1c.
    porterstemmer_step2($word, $r1);
    $this->assertEqual($word, 'geolog', "Step2 should be geolog, was {$word}", 'Stemmer steps');
  }

  /**
   * Test internal steps on the words "ies" and "ied".
   */
  public function testIesIed() {
    $r1a = 0;
    $r2a = 0;
    $r1b = 0;
    $r2b = 0;
    $worda = 'ied';
    $wordb = 'ies';

    variable_set('minimum_word_size', 2);
    porterstemmer_too_short('', TRUE);
    porterstemmer_prestemming($worda, $r1a, $r2a);
    porterstemmer_prestemming($wordb, $r1b, $r2b);

    // Test step 1a of the algorithm: both words should reduce to "ie".
    porterstemmer_step1a($worda);
    porterstemmer_step1a($wordb);
    $this->assertEqual($worda, 'ie', "Step1a should be ie, was {$worda}", 'Stemmer steps');
    $this->assertEqual($wordb, 'ie', "Step1a should be ie, was {$wordb}", 'Stemmer steps');
  }

  /**
   * Tests the excerpt function porterstemmer_sbp_excerpt_match().
   */
  public function testExcerpts() {
    // Test with simple stemmed match.
    $key = 'walking';
    $text = 'I walked to the Grand Walks yesterday.';
    $offset = 0;
    $boundary = '[ ]+';
    $result1 = porterstemmer_sbp_excerpt_match($key, $text, $offset, $boundary);
    $this->assertEqual($result1['where'], 2, 'Found match 1 in right place', 'Excerpt');
    $this->assertEqual($result1['keyword'], 'walked', 'Found right keyword for match 1', 'Excerpt');

    // Test with upper-case in the keyword.
    $result1b = porterstemmer_sbp_excerpt_match('waLk', $text, $offset, $boundary);
    $this->assertEqual($result1b['where'], 2, 'Found match 1b in right place', 'Excerpt');
    $this->assertEqual($result1b['keyword'], 'walked', 'Found right keyword for match 1b', 'Excerpt');

    // Test with upper-case in the text. Starting the search at offset 12
    // skips "walked", so the expected match is "Walks".
    $offset = 12;
    $result2 = porterstemmer_sbp_excerpt_match($key, $text, $offset, $boundary);
    $this->assertEqual($result2['where'], 22, 'Found match 2 in right place', 'Excerpt');
    $this->assertEqual($result2['keyword'], 'Walks', 'Found right keyword for match 2', 'Excerpt');

    // Test with a false match followed by a real match.
    $text = 'I walknotawordhere to walk to school.';
    $offset = 0;
    $result3 = porterstemmer_sbp_excerpt_match($key, $text, $offset, $boundary);
    $this->assertEqual($result3['where'], 22, 'Found match 3 in right place', 'Excerpt');
    $this->assertEqual($result3['keyword'], 'walk', 'Found right keyword for match 3', 'Excerpt');
  }

}
Members
Name | Modifiers | Type | Description | Overrides |
---|---|---|---|---|
DrupalTestCase:: |
protected | property | Assertions thrown in that test case. | |
DrupalTestCase:: |
protected | property | The database prefix of this test run. | |
DrupalTestCase:: |
protected | property | The original file directory, before it was changed for testing purposes. | |
DrupalTestCase:: |
public | property | Current results of this test case. | |
DrupalTestCase:: |
protected | property | Flag to indicate whether the test has been set up. | |
DrupalTestCase:: |
protected | property | ||
DrupalTestCase:: |
protected | property | ||
DrupalTestCase:: |
protected | property | This class is skipped when looking for the source of an assertion. | |
DrupalTestCase:: |
protected | property | The test run ID. | |
DrupalTestCase:: |
protected | property | Time limit for the test. | |
DrupalTestCase:: |
public | property | Whether to cache the installation part of the setUp() method. | |
DrupalTestCase:: |
public | property | Whether to cache the modules installation part of the setUp() method. | |
DrupalTestCase:: |
protected | property | URL to the verbose output file directory. | |
DrupalTestCase:: |
protected | function | Internal helper: stores the assert. | |
DrupalTestCase:: |
protected | function | Check to see if two values are equal. | |
DrupalTestCase:: |
protected | function | Check to see if a value is false (an empty string, 0, NULL, or FALSE). | |
DrupalTestCase:: |
protected | function | Check to see if two values are identical. | |
DrupalTestCase:: |
protected | function | Check to see if two values are not equal. | |
DrupalTestCase:: |
protected | function | Check to see if two values are not identical. | |
DrupalTestCase:: |
protected | function | Check to see if a value is not NULL. | |
DrupalTestCase:: |
protected | function | Check to see if a value is NULL. | |
DrupalTestCase:: |
protected | function | Check to see if a value is not false (not an empty string, 0, NULL, or FALSE). | |
DrupalTestCase:: |
public static | function | Delete an assertion record by message ID. | |
DrupalTestCase:: |
protected | function | Fire an error assertion. | 1 |
DrupalTestCase:: |
public | function | Handle errors during test runs. | 1 |
DrupalTestCase:: |
protected | function | Handle exceptions. | |
DrupalTestCase:: |
protected | function | Fire an assertion that is always negative. | |
DrupalTestCase:: |
public static | function | Converts a list of possible parameters into a stack of permutations. | |
DrupalTestCase:: |
protected | function | Cycles through backtrace until the first non-assertion method is found. | |
DrupalTestCase:: |
public static | function | Returns the database connection to the site running Simpletest. | |
DrupalTestCase:: |
public static | function | Store an assertion from outside the testing context. | |
DrupalTestCase:: |
protected | function | Fire an assertion that is always positive. | |
DrupalTestCase:: |
public static | function | Generates a random string containing letters and numbers. | |
DrupalTestCase:: |
public static | function | Generates a random string of ASCII characters of codes 32 to 126. | |
DrupalTestCase:: |
public | function | Run all tests in this class. | |
DrupalTestCase:: |
protected | function | Logs a verbose message in a text file. | |
DrupalWebTestCase:: |
protected | property | Additional cURL options. | |
DrupalWebTestCase:: |
protected | property | The content of the page currently loaded in the internal browser. | |
DrupalWebTestCase:: |
protected | property | The current cookie file used by cURL. | |
DrupalWebTestCase:: |
protected | property | The cookies of the page currently loaded in the internal browser. | |
DrupalWebTestCase:: |
protected | property | The handle of the current cURL connection. | |
DrupalWebTestCase:: |
protected | property | The value of the Drupal.settings JavaScript variable for the page currently loaded in the internal browser. | |
DrupalWebTestCase:: |
protected | property | The parsed version of the page. | |
DrupalWebTestCase:: |
protected | property | Whether the files were copied to the test files directory. | |
DrupalWebTestCase:: |
protected | property | The headers of the page currently loaded in the internal browser. | |
DrupalWebTestCase:: |
protected | property | HTTP authentication credentials (<username>:<password>). | |
DrupalWebTestCase:: |
protected | property | HTTP authentication method | |
DrupalWebTestCase:: |
protected | property | The current user logged in using the internal browser. | |
DrupalWebTestCase:: |
protected | property | The original shutdown handlers array, before it was cleaned for testing purposes. | |
DrupalWebTestCase:: |
protected | property | The original user, before it was changed to a clean uid = 1 for testing purposes. | |
DrupalWebTestCase:: |
protected | property | The content of the page currently loaded in the internal browser (plain text version). | |
DrupalWebTestCase:: |
protected | property | The profile to install as a basis for testing. | 20 |
DrupalWebTestCase:: |
protected | property | The number of redirects followed during the handling of a request. | |
DrupalWebTestCase:: |
protected | property | The current session ID, if available. | |
DrupalWebTestCase:: |
protected | property | The current session name, if available. | |
DrupalWebTestCase:: |
protected | property | The URL currently loaded in the internal browser. | |
DrupalWebTestCase:: |
protected | function | Asserts that a field exists with the given name or ID. | |
DrupalWebTestCase:: |
protected | function | Asserts that a field exists in the current page with the given ID and value. | |
DrupalWebTestCase:: |
protected | function | Asserts that a field exists in the current page with the given name and value. | |
DrupalWebTestCase:: |
protected | function | Asserts that a field exists in the current page by the given XPath. | |
DrupalWebTestCase:: |
protected | function | Asserts that a checkbox field in the current page is checked. | |
DrupalWebTestCase:: |
protected | function | Pass if a link with the specified label is found, and optional with the specified index. | |
DrupalWebTestCase:: |
protected | function | Pass if a link containing a given href (part) is found. | |
DrupalWebTestCase:: |
protected | function | Asserts that the most recently sent e-mail message has the given value. | |
DrupalWebTestCase:: |
protected | function | Asserts that the most recently sent e-mail message has the pattern in it. | |
DrupalWebTestCase:: |
protected | function | Asserts that the most recently sent e-mail message has the string in it. | |
DrupalWebTestCase:: |
protected | function | Asserts that each HTML ID is used for just a single element. | |
DrupalWebTestCase:: |
protected | function | Asserts that a field does not exist with the given name or ID. | |
DrupalWebTestCase:: |
protected | function | Asserts that a field does not exist with the given ID and value. | |
DrupalWebTestCase:: |
protected | function | Asserts that a field does not exist with the given name and value. | |
DrupalWebTestCase:: |
protected | function | Asserts that a field doesn't exist or its value doesn't match, by XPath. | |
DrupalWebTestCase:: |
protected | function | Asserts that a checkbox field in the current page is not checked. | |
DrupalWebTestCase:: |
protected | function | Pass if a link with the specified label is not found. | |
DrupalWebTestCase:: |
protected | function | Pass if a link containing a given href (part) is not found. | |
DrupalWebTestCase:: |
protected | function | Asserts that a select option in the current page is not checked. | |
DrupalWebTestCase:: |
protected | function | Will trigger a pass if the perl regex pattern is not present in raw content. | |
DrupalWebTestCase:: |
protected | function | Pass if the raw text is NOT found on the loaded page, fail otherwise. Raw text refers to the raw HTML that the page generated. | |
DrupalWebTestCase:: |
protected | function | Asserts the page did not return the specified response code. | |
DrupalWebTestCase:: |
protected | function | Pass if the text is NOT found on the text version of the page. The text version is the equivalent of what a user would see when viewing through a web browser. In other words the HTML has been filtered out of the contents. | |
DrupalWebTestCase:: |
protected | function | Pass if the page title is not the given string. | |
DrupalWebTestCase:: |
protected | function | Pass if the text is found MORE THAN ONCE on the text version of the page. | |
DrupalWebTestCase:: |
protected | function | Asserts that a select option in the current page is checked. | |
DrupalWebTestCase:: |
protected | function | Will trigger a pass if the Perl regex pattern is found in the raw content. | |
DrupalWebTestCase:: |
protected | function | Pass if the raw text IS found on the loaded page, fail otherwise. Raw text refers to the raw HTML that the page generated. | |
DrupalWebTestCase:: |
protected | function | Asserts the page responds with the specified response code. | |
DrupalWebTestCase:: |
protected | function | Pass if the text IS found on the text version of the page. The text version is the equivalent of what a user would see when viewing through a web browser. In other words the HTML has been filtered out of the contents. | |
DrupalWebTestCase:: |
protected | function | Helper for assertText and assertNoText. | |
DrupalWebTestCase:: |
protected | function | Asserts themed output. | |
DrupalWebTestCase:: |
protected | function | Pass if the page title is the given string. | |
DrupalWebTestCase:: |
protected | function | Pass if the text is found ONLY ONCE on the text version of the page. | |
DrupalWebTestCase:: |
protected | function | Helper for assertUniqueText and assertNoUniqueText. | |
DrupalWebTestCase:: |
protected | function | Pass if the internal browser's URL matches the given path. | |
DrupalWebTestCase:: |
protected | function | Builds an XPath query. | |
DrupalWebTestCase:: |
protected | function | Changes the database connection to the prefixed one. | |
DrupalWebTestCase:: |
protected | function | Check for meta refresh tag and if found call drupalGet() recursively. This function looks for the http-equiv attribute to be set to "Refresh" and is case-sensitive. | |
DrupalWebTestCase:: |
protected | function | Check to make sure that the array of permissions are valid. | |
DrupalWebTestCase:: |
protected | function | Follows a link by name. | |
DrupalWebTestCase:: |
protected | function | Helper function: construct an XPath for the given set of attributes and value. | |
DrupalWebTestCase:: |
protected | function | Copy the setup cache from/to another table and files directory. | |
DrupalWebTestCase:: |
protected | function | Runs cron in the Drupal installed by Simpletest. | |
DrupalWebTestCase:: |
protected | function | Close the cURL handler and unset the handler. | |
DrupalWebTestCase:: |
protected | function | Initializes and executes a cURL request. | |
DrupalWebTestCase:: |
protected | function | Reads headers and registers errors received from the tested site. | |
DrupalWebTestCase:: |
protected | function | Initializes the cURL connection. | |
DrupalWebTestCase:: |
protected | function | Compare two files based on size and file name. | |
DrupalWebTestCase:: |
protected | function | Creates a custom content type based on default settings. | |
DrupalWebTestCase:: |
protected | function | Creates a node based on default settings. | |
DrupalWebTestCase:: |
protected | function | Creates a role with specified permissions. | |
DrupalWebTestCase:: |
protected | function | Create a user with a given set of permissions. | |
DrupalWebTestCase:: |
protected | function | Retrieves a Drupal path or an absolute path. | |
DrupalWebTestCase:: |
protected | function | Retrieve a Drupal path or an absolute path and JSON decode the result. | |
DrupalWebTestCase:: |
protected | function | Gets the current raw HTML of requested page. | |
DrupalWebTestCase:: |
protected | function | Gets the value of an HTTP response header. If multiple requests were required to retrieve the page, only the headers from the last request will be checked by default. However, if TRUE is passed as the second argument, all requests will be processed… | |
DrupalWebTestCase:: |
protected | function | Gets the HTTP response headers of the requested page. Normally we are only interested in the headers returned by the last request. However, if a page is redirected or HTTP authentication is in use, multiple requests will be required to retrieve the… | |
DrupalWebTestCase:: |
protected | function | Gets an array containing all e-mails sent during this test case. | |
DrupalWebTestCase:: |
function | Get a node from the database based on its title. | ||
DrupalWebTestCase:: |
protected | function | Gets the value of the Drupal.settings JavaScript variable for the currently loaded page. | |
DrupalWebTestCase:: |
protected | function | Get a list files that can be used in tests. | |
DrupalWebTestCase:: |
protected | function | Generate a token for the currently logged in user. | |
DrupalWebTestCase:: |
protected | function | Retrieves only the headers for a Drupal path or an absolute path. | |
DrupalWebTestCase:: |
protected | function | Log in a user with the internal browser. | |
DrupalWebTestCase:: |
protected | function | ||
DrupalWebTestCase:: |
protected | function | Execute a POST request on a Drupal page. It will be done as usual POST request with SimpleBrowser. | |
DrupalWebTestCase:: |
protected | function | Execute an Ajax submission. | |
DrupalWebTestCase:: |
protected | function | Sets the raw HTML content. This can be useful when a page has been fetched outside of the internal browser and assertions need to be made on the returned page. | |
DrupalWebTestCase:: |
protected | function | Sets the value of the Drupal.settings JavaScript variable for the currently loaded page. | |
DrupalWebTestCase:: |
protected | function | Takes a path and returns an absolute path. | |
DrupalWebTestCase:: |
protected | function | Get all option elements, including nested options, in a select. | |
DrupalWebTestCase:: |
protected | function | Get the selected value from a select field. | |
DrupalWebTestCase:: |
protected | function | Returns the cache key used for the setup caching. | |
DrupalWebTestCase:: |
protected | function | Get the current URL from the cURL handler. | |
DrupalWebTestCase:: |
protected | function | Handle form input related to drupalPost(). Ensure that the specified fields exist and attempt to create POST data in the correct manner for the particular field type. | |
DrupalWebTestCase:: |
protected | function | Copies the cached tables and files for a cached installation setup. | |
DrupalWebTestCase:: |
protected | function | Parse content returned from curlExec using DOM and SimpleXML. | |
DrupalWebTestCase:: |
protected | function | Preload the registry from the testing site. | |
DrupalWebTestCase:: |
protected | function | Generates a database prefix for running tests. | |
DrupalWebTestCase:: |
protected | function | Prepares the current environment for running the test. | |
DrupalWebTestCase:: |
protected | function | Recursively copy one directory to another. | |
DrupalWebTestCase:: |
protected | function | Refresh the in-memory set of variables. Useful after a page request is made that changes a variable in a different thread. | 1 |
DrupalWebTestCase:: |
protected | function | Reset all data structures after having enabled new modules. | |
DrupalWebTestCase:: |
protected | function | Store the installation setup to a cache. | |
DrupalWebTestCase:: |
protected | function | Delete created files and temporary files directory, delete the tables created by setUp(), and reset the database prefix. | 6 |
DrupalWebTestCase:: |
protected | function | Outputs to verbose the most recent $count emails sent. | |
DrupalWebTestCase:: |
protected | function | Perform an xpath search on the contents of the internal browser. The search is relative to the root element (HTML tag normally) of the page. | |
DrupalWebTestCase:: |
function |
Constructor for DrupalWebTestCase. Overrides DrupalTestCase:: |
1 | |
PorterStemmerInternalsUnitTest::getInfo |
public static | function | ||
PorterStemmerInternalsUnitTest::setUp |
public | function |
Sets up a Drupal site for running functional and integration tests. Overrides DrupalWebTestCase::setUp |
|
PorterStemmerInternalsUnitTest::testAdministered |
function | Test internal steps on the word "administered". | ||
PorterStemmerInternalsUnitTest::testBaked |
function | Test internal steps on the word "baked". | ||
PorterStemmerInternalsUnitTest::testExcerpts |
function | Tests the excerpt function porterstemmer_sbp_excerpt_match(). | ||
PorterStemmerInternalsUnitTest::testGeology |
function | Test internal steps on the word "geology". | ||
PorterStemmerInternalsUnitTest::testIesIed |
function | Test internal steps on the words "ies" and "ied". | ||
PorterStemmerInternalsUnitTest::testShortWord |
function | Tests the function that determines if a word is "short". | ||
PorterStemmerInternalsUnitTest::testStemLength3UnitTest |
function | Verify that short words are not stemmed, and longer ones are. | ||
PorterStemmerInternalsUnitTest::testStemLength4UnitTest |
function | Verify that short words are not stemmed, and longer ones are. |