From e8265f07592937f149d0b1e4ba78898b71b86d10 Mon Sep 17 00:00:00 2001
From: Steven Wittens
Date: Tue, 30 Dec 2003 05:58:17 +0000
Subject: - Bugfix: the XML parser in PHP4 requires you to specify the input encoding explicitly. Added a short piece of code that does this. (see drupal.org's Drupal Talk to see this bug in action)

---
 modules/aggregator.module | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

(limited to 'modules/aggregator.module')

diff --git a/modules/aggregator.module b/modules/aggregator.module
index fc6012319..be29a8995 100644
--- a/modules/aggregator.module
+++ b/modules/aggregator.module
@@ -325,8 +325,13 @@ function import_refresh($feed) {
     return t("failed to parse RSS feed '%site': suspicious input data.", array("%site" => $feed["title"]));
   }
 
+  // extract the XML file's encoding (the XML parser in PHP4 doesn't do this by itself):
+  if (ereg('encoding="([^"]+)"', $data, $match)) {
+    $encoding = $match[1];
+  }
+
   // parse the data:
-  $xml_parser = xml_parser_create();
+  $xml_parser = xml_parser_create($encoding);
   xml_set_element_handler($xml_parser, "import_element_start", "import_element_end");
   xml_set_character_data_handler($xml_parser, "import_element_data");
   xml_parser_set_option($xml_parser, XML_OPTION_TARGET_ENCODING, "utf-8");
-- 
cgit v1.2.3