File tree Expand file tree Collapse file tree 2 files changed +13
-1
lines changed Expand file tree Collapse file tree 2 files changed +13
-1
lines changed Original file line number Diff line number Diff line change @@ -160,7 +160,9 @@ protected function generateTermScoreMapFromHtml(string $html): array
160
160
/** @var DOMNode $child */
161
161
foreach ($ doc ->getBodyChildren () as $ child ) {
162
162
$ nodeName = $ child ->nodeName ;
163
- $ termCounts = $ this ->textToTermCountMap (trim ($ child ->textContent ));
163
+ $ text = trim ($ child ->textContent );
164
+ $ text = str_replace ("\u{00A0}" , ' ' , $ text );
165
+ $ termCounts = $ this ->textToTermCountMap ($ text );
164
166
foreach ($ termCounts as $ term => $ count ) {
165
167
$ scoreChange = $ count * ($ elementScoreAdjustmentMap [$ nodeName ] ?? 1 );
166
168
$ scoresByTerm [$ term ] = ($ scoresByTerm [$ term ] ?? 0 ) + $ scoreChange ;
Original file line number Diff line number Diff line change @@ -106,4 +106,14 @@ public function test_terms_containing_punctuation_within_retain_original_form_an
106
106
$ this ->assertNull ($ scoreByTerm ->get ($ term ), "Failed asserting that \"$ term \" is not indexed " );
107
107
}
108
108
}
109
+
110
/**
 * Non-breaking spaces between words must act as ordinary word separators
 * when page content is indexed, so each word becomes its own search term.
 */
public function test_non_breaking_spaces_handled_as_spaces()
{
    // Words are separated ONLY by &nbsp; entities (presumably decoded to
    // U+00A0 by the HTML parser before indexing - confirm). With plain
    // spaces this test would pass even without non-breaking-space handling.
    $page = $this->entities->newPage(['html' => '<p>a&nbsp;tigerbadger&nbsp;is&nbsp;a&nbsp;dangerous&nbsp;animal</p>']);

    $scoreByTerm = $page->searchTerms()->pluck('score', 'term');

    // Each of these words must have been indexed as a separate term.
    foreach (['tigerbadger', 'dangerous', 'animal'] as $term) {
        $this->assertNotNull($scoreByTerm->get($term), "Failed asserting that \"$term\" is indexed");
    }
}
109
119
}
You can’t perform that action at this time.
0 commit comments