BUG Exclude meta info from SolrCell content retrieval

The pattern was matching up to the last </str> greedily, so the captured content included too much (the trailing meta info).
2024-10-22 09:06:00 +00:00 · 2013-03-11 00:56:44 +01:00 · 2013-03-11 00:56:44 +01:00 · f2c8df2348
commit f2c8df2348
parent 9af389f51b
1 changed file with 1 addition and 1 deletion
--- a/code/extractors/SolrCellTextExtractor.php
+++ b/code/extractors/SolrCellTextExtractor.php
@ -55,7 +55,7 @@ class SolrCellTextExtractor extends FileTextExtractor {
 		$response = $request->send();
 		// Use preg match to avoid SimpleXML running out of memory on large text nodes
 		preg_match(
-			sprintf('/\<str name\="%s"\>(.*)\<\/str\>/s', preg_quote($fileName)),
+			sprintf('/\<str name\="%s"\>(.*?)\<\/str\>/s', preg_quote($fileName)),
 			(string)$response->getBody(), 
 			$matches
 		);