@@ -39,7 +39,7 @@ class PortugueseStemmer implements StemmerInterface
3939 /**
4040 * UTF-8 Case lookup table
4141 *
42- * This lookuptable defines the upper case letters to their correspponding
42+ * This lookup table defines the upper case letters to their corresponding
4343 * lower case letter in UTF-8
4444 *
4545 * @author Andreas Gohr <[email protected]>
@@ -71,23 +71,22 @@ class PortugueseStemmer implements StemmerInterface
7171 0x0066 => 0x0046 , 0x00FD => 0x00DD , 0x0063 => 0x0043 , 0x021B => 0x021A , 0x00EA => 0x00CA ,
7272 0x03B9 => 0x0399 , 0x017A => 0x0179 , 0x00EF => 0x00CF , 0x01B0 => 0x01AF , 0x0065 => 0x0045 ,
7373 0x03BB => 0x039B , 0x03B8 => 0x0398 , 0x03BC => 0x039C , 0x045C => 0x040C , 0x043F => 0x041F ,
74- 0x044C => 0x042C , 0x00FE => 0x00DE , 0x00F0 => 0x00D0 , 0x1EF3 => 0x1EF2 , 0x0068 => 0x0048 ,
75- 0x00EB => 0x00CB , 0x0111 => 0x0110 , 0x0433 => 0x0413 , 0x012F => 0x012E , 0x00E6 => 0x00C6 ,
76- 0x0078 => 0x0058 , 0x0161 => 0x0160 , 0x016F => 0x016E , 0x03B1 => 0x0391 , 0x0457 => 0x0407 ,
77- 0x0173 => 0x0172 , 0x00FF => 0x0178 , 0x006F => 0x004F , 0x043B => 0x041B , 0x03B5 => 0x0395 ,
78- 0x0445 => 0x0425 , 0x0121 => 0x0120 , 0x017E => 0x017D , 0x017C => 0x017B , 0x03B6 => 0x0396 ,
79- 0x03B2 => 0x0392 , 0x03AD => 0x0388 , 0x1E85 => 0x1E84 , 0x0175 => 0x0174 , 0x0071 => 0x0051 ,
80- 0x0437 => 0x0417 , 0x1E0B => 0x1E0A , 0x0148 => 0x0147 , 0x0105 => 0x0104 , 0x0458 => 0x0408 ,
81- 0x014D => 0x014C , 0x00ED => 0x00CD , 0x0079 => 0x0059 , 0x010B => 0x010A , 0x03CE => 0x038F ,
82- 0x0072 => 0x0052 , 0x0430 => 0x0410 , 0x0455 => 0x0405 , 0x0452 => 0x0402 , 0x0127 => 0x0126 ,
83- 0x0137 => 0x0136 , 0x012B => 0x012A , 0x03AF => 0x038A , 0x044B => 0x042B , 0x006C => 0x004C ,
84- 0x03B7 => 0x0397 , 0x0125 => 0x0124 , 0x0219 => 0x0218 , 0x00FB => 0x00DB , 0x011F => 0x011E ,
85- 0x043E => 0x041E , 0x1E41 => 0x1E40 , 0x03BD => 0x039D , 0x0107 => 0x0106 , 0x03CB => 0x03AB ,
86- 0x0446 => 0x0426 , 0x00FE => 0x00DE , 0x00E7 => 0x00C7 , 0x03CA => 0x03AA , 0x0441 => 0x0421 ,
87- 0x0432 => 0x0412 , 0x010F => 0x010E , 0x00F8 => 0x00D8 , 0x0077 => 0x0057 , 0x011B => 0x011A ,
88- 0x0074 => 0x0054 , 0x006A => 0x004A , 0x045B => 0x040B , 0x0456 => 0x0406 , 0x0103 => 0x0102 ,
89- 0x03BB => 0x039B , 0x00F1 => 0x00D1 , 0x043D => 0x041D , 0x03CC => 0x038C , 0x00E9 => 0x00C9 ,
90- 0x00F0 => 0x00D0 , 0x0457 => 0x0407 , 0x0123 => 0x0122
74+ 0x044C => 0x042C , 0x1EF3 => 0x1EF2 , 0x0068 => 0x0048 , 0x00EB => 0x00CB , 0x0111 => 0x0110 ,
75+ 0x0433 => 0x0413 , 0x012F => 0x012E , 0x00E6 => 0x00C6 , 0x0078 => 0x0058 , 0x0161 => 0x0160 ,
76+ 0x016F => 0x016E , 0x03B1 => 0x0391 , 0x0457 => 0x0407 , 0x0173 => 0x0172 , 0x00FF => 0x0178 ,
77+ 0x006F => 0x004F , 0x043B => 0x041B , 0x03B5 => 0x0395 , 0x0445 => 0x0425 , 0x0121 => 0x0120 ,
78+ 0x017E => 0x017D , 0x017C => 0x017B , 0x03B6 => 0x0396 , 0x03B2 => 0x0392 , 0x03AD => 0x0388 ,
79+ 0x1E85 => 0x1E84 , 0x0175 => 0x0174 , 0x0071 => 0x0051 , 0x0437 => 0x0417 , 0x1E0B => 0x1E0A ,
80+ 0x0148 => 0x0147 , 0x0105 => 0x0104 , 0x0458 => 0x0408 , 0x014D => 0x014C , 0x00ED => 0x00CD ,
81+ 0x0079 => 0x0059 , 0x010B => 0x010A , 0x03CE => 0x038F , 0x0072 => 0x0052 , 0x0430 => 0x0410 ,
82+ 0x0455 => 0x0405 , 0x0452 => 0x0402 , 0x0127 => 0x0126 , 0x0137 => 0x0136 , 0x012B => 0x012A ,
83+ 0x03AF => 0x038A , 0x044B => 0x042B , 0x006C => 0x004C , 0x03B7 => 0x0397 , 0x0125 => 0x0124 ,
84+ 0x0219 => 0x0218 , 0x00FB => 0x00DB , 0x011F => 0x011E , 0x043E => 0x041E , 0x1E41 => 0x1E40 ,
85+ 0x03BD => 0x039D , 0x0107 => 0x0106 , 0x03CB => 0x03AB , 0x0446 => 0x0426 , 0x00E7 => 0x00C7 ,
86+ 0x03CA => 0x03AA , 0x0441 => 0x0421 , 0x0432 => 0x0412 , 0x010F => 0x010E , 0x00F8 => 0x00D8 ,
87+ 0x0077 => 0x0057 , 0x011B => 0x011A , 0x0074 => 0x0054 , 0x006A => 0x004A , 0x045B => 0x040B ,
88+ 0x0456 => 0x0406 , 0x0103 => 0x0102 , 0x00F1 => 0x00D1 , 0x043D => 0x041D , 0x03CC => 0x038C ,
89+ 0x00E9 => 0x00C9 , 0x0123 => 0x0122
9190 ];
9291
9392 private static array $ vowels = ['a ' , 'e ' , 'i ' , 'o ' , 'u ' , 'á ' , 'é ' , 'í ' , 'ó ' , 'ú ' , 'â ' , 'ê ' , 'ô ' ];
@@ -419,7 +418,7 @@ private static function step1(&$word, $r1Index, $r2Index, $rvIndex)
419418 $ before = $ position - 1 ;
420419 $ letter = self ::substr ($ word , $ before , 1 );
421420
422- if ($ letter == 'e ' ) {
421+ if ($ letter === 'e ' ) {
423422 $ word = preg_replace ('#(iras|ira)$#u ' , 'ir ' , $ word );
424423 }
425424 }
@@ -455,7 +454,7 @@ private static function step3(&$word, $rvIndex)
455454 if (self ::searchIfInRv ($ word , ['i ' ], $ rvIndex ) !== false ) {
456455 $ letter = self ::substr ($ word , -2 , 1 );
457456
458- if ($ letter == 'c ' ) {
457+ if ($ letter === 'c ' ) {
459458 $ word = self ::substr ($ word , 0 , -1 );
460459 }
461460
0 commit comments