From 9c5708cc92af894e414bc76ee35ec2230de5d288 Mon Sep 17 00:00:00 2001
From: Agustin Henze <tin@sluc.org.ar>
Date: Wed, 2 Jan 2013 08:35:03 -0300
Subject: Imported Upstream version 5.1

---
 tests/context.py                       |   9 +
 tests/rss-2_0.xsd                      | 500 +++++++++++++++++++++++++++++++++
 tests/test_command_import_wordpress.py |  92 ++++++
 tests/test_rss_feeds.py                | 104 +++++++
 tests/wordpress_export_example.xml     | 174 ++++++++++++
 tests/wordpress_unicode_export.xml     | 114 ++++++++
 6 files changed, 993 insertions(+)
 create mode 100644 tests/context.py
 create mode 100644 tests/rss-2_0.xsd
 create mode 100644 tests/test_command_import_wordpress.py
 create mode 100644 tests/test_rss_feeds.py
 create mode 100644 tests/wordpress_export_example.xml
 create mode 100644 tests/wordpress_unicode_export.xml

(limited to 'tests')

diff --git a/tests/context.py b/tests/context.py
new file mode 100644
index 0000000..f292b79
--- /dev/null
+++ b/tests/context.py
@@ -0,0 +1,9 @@
+# -*- coding: utf-8 -*-
+
+# Path hack as shown by Kenneth Reitz at http://kennethreitz.com/repository-structure-and-python.html
+# Anchored on this file's location so the import works from any working directory.
+import os
+import sys
+sys.path.insert(0, os.path.abspath(os.path.join(os.path.dirname(__file__), '..')))
+
+import nikola
diff --git a/tests/rss-2_0.xsd b/tests/rss-2_0.xsd
new file mode 100644
index 0000000..d7ddaee
--- /dev/null
+++ b/tests/rss-2_0.xsd
@@ -0,0 +1,500 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+    XML Schema for RSS v2.0
+    Copyright (C) 2003-2008  Jorgen Thelin
+
+Microsoft Public License (Ms-PL)
+
+This license governs use of the accompanying software. 
+If you use the software, you accept this license. 
+If you do not accept the license, do not use the software.
+
+1. Definitions
+
+The terms "reproduce," "reproduction," "derivative works," and "distribution" have the same meaning here as under U.S. copyright law.
+
+    A "contribution" is the original software, or any additions or changes to the software.
+
+    A "contributor" is any person that distributes its contribution under this license.
+
+    "Licensed patents" are a contributor's patent claims that read directly on its contribution.
+
+2. Grant of Rights
+
+    (A) Copyright Grant- Subject to the terms of this license, including the license conditions and limitations in section 3, each contributor grants you a non-exclusive, worldwide, royalty-free copyright license to reproduce its contribution, prepare derivative works of its contribution, and distribute its contribution or any derivative works that you create.
+
+    (B) Patent Grant- Subject to the terms of this license, including the license conditions and limitations in section 3, each contributor grants you a non-exclusive, worldwide, royalty-free license under its licensed patents to make, have made, use, sell, offer for sale, import, and/or otherwise dispose of its contribution in the software or derivative works of the contribution in the software.
+
+3. Conditions and Limitations
+
+    (A) No Trademark License- This license does not grant you rights to use any contributors' name, logo, or trademarks.
+
+    (B) If you bring a patent claim against any contributor over patents that you claim are infringed by the software, your patent license from such contributor to the software ends automatically.
+
+    (C) If you distribute any portion of the software, you must retain all copyright, patent, trademark, and attribution notices that are present in the software.
+
+    (D) If you distribute any portion of the software in source code form, you may do so only under this license by including a complete copy of this license with your distribution. If you distribute any portion of the software in compiled or object code form, you may only do so under a license that complies with this license.
+
+    (E) The software is licensed "as-is." You bear the risk of using it. The contributors give no express warranties, guarantees or conditions. You may have additional consumer rights under your local laws which this license cannot change. To the extent permitted under your local laws, the contributors exclude the implied warranties of merchantability, fitness for a particular purpose and non-infringement. 
+
+-->
+<xs:schema xmlns:xs="http://www.w3.org/2001/XMLSchema" 
+           elementFormDefault="unqualified" 
+           version="2.0.2.16">
+  <xs:annotation>
+    <xs:documentation>XML Schema for RSS v2.0 feed files.</xs:documentation>
+    <xs:documentation>Project home: http://www.codeplex.com/rss2schema/ </xs:documentation>
+    <xs:documentation>Based on the RSS 2.0 specification document at http://cyber.law.harvard.edu/rss/rss.html </xs:documentation>
+    <xs:documentation>Author: Jorgen Thelin</xs:documentation>
+    <xs:documentation>Revision: 16</xs:documentation>
+    <xs:documentation>Date: 01-Nov-2008</xs:documentation>
+    <xs:documentation>Feedback to: http://www.codeplex.com/rss2schema/WorkItem/List.aspx </xs:documentation>
+  </xs:annotation>
+  <xs:element name="rss">
+    <xs:complexType>
+      <xs:sequence>
+        <xs:element name="channel" type="RssChannel"/>
+        <xs:any namespace="##other" processContents="lax" minOccurs="0" maxOccurs="unbounded"/>
+      </xs:sequence>
+      <xs:attribute name="version" type="xs:decimal" use="required" fixed="2.0"/>
+      <xs:anyAttribute namespace="##any"/>
+    </xs:complexType>
+  </xs:element>
+  <xs:complexType name="RssItem">
+    <xs:annotation>
+      <xs:documentation>An item may represent a "story" -- much like a story in a newspaper or magazine; if so its description is a synopsis of the story, and the link points to the full story. An item may also be complete in itself, if so, the description contains the text (entity-encoded HTML is allowed), and the link and title may be omitted.</xs:documentation>
+    </xs:annotation>
+    <xs:sequence>
+      <xs:choice maxOccurs="unbounded">
+        <xs:element name="title" type="xs:string" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>The title of the item.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="description" type="xs:string" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>The item synopsis.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="link" type="xs:anyURI" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>The URL of the item.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="author" type="EmailAddress" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>Email address of the author of the item.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="category" type="Category" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>Includes the item in one or more categories. </xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="comments" type="xs:anyURI" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>URL of a page for comments relating to the item.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="enclosure" type="Enclosure" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>Describes a media object that is attached to the item.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="guid" type="Guid" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>guid or permalink URL for this entry</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="pubDate" type="Rfc822FormatDate" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>Indicates when the item was published.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="source" type="Source" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>The RSS channel that the item came from.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:any namespace="##other" processContents="lax" minOccurs="0" maxOccurs="unbounded">
+          <xs:annotation>
+            <xs:documentation>Extensibility element.</xs:documentation>
+          </xs:annotation>
+        </xs:any>
+      </xs:choice>
+    </xs:sequence>
+    <xs:anyAttribute namespace="##any"/>
+  </xs:complexType>
+  <xs:complexType name="RssChannel">
+    <xs:sequence>
+      <xs:choice maxOccurs="unbounded">
+        <xs:element name="title" type="xs:string">
+          <xs:annotation>
+            <xs:documentation>The name of the channel. It's how people refer to your service. If you have an HTML website that contains the same information as your RSS file, the title of your channel should be the same as the title of your website.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="link" type="xs:anyURI">
+          <xs:annotation>
+            <xs:documentation>The URL to the HTML website corresponding to the channel.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="description" type="xs:string">
+          <xs:annotation>
+            <xs:documentation>Phrase or sentence describing the channel.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="language" type="xs:language" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>The language the channel is written in. This allows aggregators to group all Italian language sites, for example, on a single page. A list of allowable values for this element, as provided by Netscape, is here. You may also use values defined by the W3C.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="copyright" type="xs:string" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>Copyright notice for content in the channel.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="managingEditor" type="EmailAddress" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>Email address for person responsible for editorial content.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="webMaster" type="EmailAddress" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>Email address for person responsible for technical issues relating to channel.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="pubDate" type="Rfc822FormatDate" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>The publication date for the content in the channel. All date-times in RSS conform to the Date and Time Specification of RFC 822, with the exception that the year may be expressed with two characters or four characters (four preferred).</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="lastBuildDate" type="Rfc822FormatDate" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>The last time the content of the channel changed.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="category" type="Category" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>Specify one or more categories that the channel belongs to.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="generator" type="xs:string" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>A string indicating the program used to generate the channel.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="docs" type="xs:anyURI" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>A URL that points to the documentation for the format used in the RSS file. It's probably a pointer to this page. It's for people who might stumble across an RSS file on a Web server 25 years from now and wonder what it is.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="cloud" type="Cloud" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>Allows processes to register with a cloud to be notified of updates to the channel, implementing a lightweight publish-subscribe protocol for RSS feeds.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="ttl" type="xs:nonNegativeInteger" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>ttl stands for time to live. It's a number of minutes that indicates how long a channel can be cached before refreshing from the source.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="image" type="Image" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>Specifies a GIF, JPEG or PNG image that can be displayed with the channel.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="rating" type="xs:string" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>The PICS rating for the channel.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="textInput" type="TextInput" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>Specifies a text input box that can be displayed with the channel.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="skipHours" type="SkipHoursList" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>A hint for aggregators telling them which hours they can skip.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:element name="skipDays" type="SkipDaysList" minOccurs="0">
+          <xs:annotation>
+            <xs:documentation>A hint for aggregators telling them which days they can skip.</xs:documentation>
+          </xs:annotation>
+        </xs:element>
+        <xs:any namespace="##other" processContents="lax" minOccurs="0" maxOccurs="unbounded">
+          <xs:annotation>
+            <xs:documentation>Extensibility element.</xs:documentation>
+          </xs:annotation>
+        </xs:any>
+      </xs:choice>
+      <xs:element name="item" type="RssItem" minOccurs="1" maxOccurs="unbounded">
+         <!-- 
+           HACK: According to the RSS 2.0 spec, it should strictly be possible to have zero item elements, 
+                 but this makes the schema non-deterministic with regard to extensibility elements
+                 so for the moment we undid bug-fix 10231 and set minOccurs=1 to work around this problem. 
+         -->
+      </xs:element>
+      <xs:any namespace="##other" processContents="lax" minOccurs="0" maxOccurs="unbounded">
+        <xs:annotation>
+          <xs:documentation>Extensibility element.</xs:documentation>
+        </xs:annotation>
+      </xs:any>
+    </xs:sequence>
+    <xs:anyAttribute namespace="##any"/>
+  </xs:complexType>
+  <xs:simpleType name="SkipHour">
+    <xs:annotation>
+      <xs:documentation>A time in GMT when aggregators should not request the channel data. The hour beginning at midnight is hour zero.</xs:documentation>
+    </xs:annotation>
+    <xs:restriction base="xs:nonNegativeInteger">
+      <xs:minInclusive value="0"/>
+      <xs:maxInclusive value="23"/>
+    </xs:restriction>
+  </xs:simpleType>
+  <xs:complexType name="SkipHoursList">
+    <xs:sequence>
+      <xs:element name="hour" type="SkipHour" minOccurs="0" maxOccurs="24"/>
+    </xs:sequence>
+  </xs:complexType>
+  <xs:simpleType name="SkipDay">
+    <xs:annotation>
+      <xs:documentation>A day when aggregators should not request the channel data.</xs:documentation>
+    </xs:annotation>
+    <xs:restriction base="xs:string">
+      <xs:enumeration value="Monday"/>
+      <xs:enumeration value="Tuesday"/>
+      <xs:enumeration value="Wednesday"/>
+      <xs:enumeration value="Thursday"/>
+      <xs:enumeration value="Friday"/>
+      <xs:enumeration value="Saturday"/>
+      <xs:enumeration value="Sunday"/>
+    </xs:restriction>
+  </xs:simpleType>
+  <xs:complexType name="SkipDaysList">
+    <xs:sequence>
+      <xs:element name="day" type="SkipDay" minOccurs="0" maxOccurs="7">
+        <xs:annotation>
+          <xs:documentation>A day of the week when aggregators should not request the channel data.</xs:documentation>
+        </xs:annotation>
+      </xs:element>
+    </xs:sequence>
+  </xs:complexType>
+  <xs:complexType name="Category">
+    <xs:simpleContent>
+      <xs:extension base="xs:string">
+        <xs:attribute name="domain" type="xs:string" use="optional"/>
+      </xs:extension>
+    </xs:simpleContent>
+  </xs:complexType>
+  <xs:complexType name="Image">
+    <xs:all>
+      <xs:element name="url" type="xs:anyURI">
+        <xs:annotation>
+          <xs:documentation>The URL of the image file.</xs:documentation>
+        </xs:annotation>
+      </xs:element>
+      <xs:element name="title" type="xs:string">
+        <xs:annotation>
+          <xs:documentation>Describes the image, it's used in the ALT attribute of the HTML &lt;img&gt; tag when the channel is rendered in HTML.</xs:documentation>
+        </xs:annotation>
+      </xs:element>
+      <xs:element name="link" type="xs:anyURI">
+        <xs:annotation>
+          <xs:documentation>The URL of the site, when the channel is rendered, the image is a link to the site. (Note, in practice the image &lt;title&gt; and &lt;link&gt; should have the same value as the channel's &lt;title&gt; and &lt;link&gt;. </xs:documentation>
+        </xs:annotation>
+      </xs:element>
+      <xs:element name="width" type="ImageWidth" default="88" minOccurs="0">
+        <xs:annotation>
+          <xs:documentation>The width of the image in pixels.</xs:documentation>
+        </xs:annotation>
+      </xs:element>
+      <xs:element name="height" type="ImageHeight" default="31" minOccurs="0">
+        <xs:annotation>
+          <xs:documentation>The height of the image in pixels.</xs:documentation>
+        </xs:annotation>
+      </xs:element>
+      <xs:element name="description" type="xs:string" minOccurs="0">
+        <xs:annotation>
+          <xs:documentation>Text that is included in the TITLE attribute of the link formed around the image in the HTML rendering.</xs:documentation>
+        </xs:annotation>
+      </xs:element>
+    </xs:all>
+  </xs:complexType>
+  <xs:simpleType name="ImageHeight">
+    <xs:annotation>
+      <xs:documentation>The height of the image in pixels.</xs:documentation>
+    </xs:annotation>
+    <xs:restriction base="xs:positiveInteger">
+      <xs:maxInclusive value="400"/>
+    </xs:restriction>
+  </xs:simpleType>
+  <xs:simpleType name="ImageWidth">
+    <xs:annotation>
+      <xs:documentation>The width of the image in pixels.</xs:documentation>
+    </xs:annotation>
+    <xs:restriction base="xs:positiveInteger">
+      <xs:maxInclusive value="144"/>
+    </xs:restriction>
+  </xs:simpleType>
+  <xs:complexType name="Cloud">
+    <xs:annotation>
+      <xs:documentation>Specifies a web service that supports the rssCloud interface which can be implemented in HTTP-POST, XML-RPC or SOAP 1.1. Its purpose is to allow processes to register with a cloud to be notified of updates to the channel, implementing a lightweight publish-subscribe protocol for RSS feeds.</xs:documentation>
+    </xs:annotation>
+    <xs:attribute name="domain" type="xs:string" use="required"/>
+    <xs:attribute name="port" type="xs:positiveInteger" use="required"/>
+    <xs:attribute name="path" type="xs:string" use="required"/>
+    <xs:attribute name="registerProcedure" type="xs:string" use="required"/>
+    <xs:attribute name="protocol" type="CloudProtocol" use="required"/>
+  </xs:complexType>
+  <xs:simpleType name="CloudProtocol">
+    <xs:restriction base="xs:string">
+      <xs:enumeration value="xml-rpc"/>
+      <xs:enumeration value="http-post"/>
+      <xs:enumeration value="soap"/>
+    </xs:restriction>
+  </xs:simpleType>
+  <xs:complexType name="TextInput">
+    <xs:annotation>
+      <xs:documentation>The purpose of this element is something of a mystery! You can use it to specify a search engine box. Or to allow a reader to provide feedback. Most aggregators ignore it.</xs:documentation>
+    </xs:annotation>
+    <xs:all>
+      <xs:element name="title" type="xs:string">
+        <xs:annotation>
+          <xs:documentation>The label of the Submit button in the text input area.</xs:documentation>
+        </xs:annotation>
+      </xs:element>
+      <xs:element name="description" type="xs:string">
+        <xs:annotation>
+          <xs:documentation>Explains the text input area.</xs:documentation>
+        </xs:annotation>
+      </xs:element>
+      <xs:element name="name" type="xs:string">
+        <xs:annotation>
+          <xs:documentation>The name of the text object in the text input area.</xs:documentation>
+        </xs:annotation>
+      </xs:element>
+      <xs:element name="link" type="xs:anyURI">
+        <xs:annotation>
+          <xs:documentation>The URL of the CGI script that processes text input requests.</xs:documentation>
+        </xs:annotation>
+      </xs:element>
+    </xs:all>
+  </xs:complexType>
+  <xs:simpleType name="EmailAddress">
+    <xs:annotation>
+      <xs:documentation>Using the regexp definition of E-Mail Address by Lucadean from the .NET RegExp Pattern Repository at http://www.3leaf.com/default/NetRegExpRepository.aspx </xs:documentation>
+    </xs:annotation>
+    <xs:restriction base="xs:string">
+      <xs:pattern value="([a-zA-Z0-9_\-])([a-zA-Z0-9_\-\.]*)@(\[((25[0-5]|2[0-4][0-9]|1[0-9][0-9]|[1-9][0-9]|[0-9])\.){3}|((([a-zA-Z0-9\-]+)\.)+))([a-zA-Z]{2,}|(25[0-5]|2[0-4][0-9]|1[0-9][0-9]|[1-9][0-9]|[0-9])\])"/>
+    </xs:restriction>
+  </xs:simpleType>
+  <xs:simpleType name="Rfc822FormatDate">
+    <xs:annotation>
+      <xs:documentation>A date-time displayed in RFC-822 format.</xs:documentation>
+      <xs:documentation>Using the regexp definition of rfc-822 date by Sam Ruby at http://www.intertwingly.net/blog/1360.html </xs:documentation>
+    </xs:annotation>
+    <xs:restriction base="xs:string">
+      <xs:pattern value="(((Mon)|(Tue)|(Wed)|(Thu)|(Fri)|(Sat)|(Sun)), *)?\d\d? +((Jan)|(Feb)|(Mar)|(Apr)|(May)|(Jun)|(Jul)|(Aug)|(Sep)|(Oct)|(Nov)|(Dec)) +\d\d(\d\d)? +\d\d:\d\d(:\d\d)? +(([+\-]?\d\d\d\d)|(UT)|(GMT)|(EST)|(EDT)|(CST)|(CDT)|(MST)|(MDT)|(PST)|(PDT)|\w)"/>
+    </xs:restriction>
+  </xs:simpleType>
+  <xs:complexType name="Source">
+    <xs:simpleContent>
+      <xs:extension base="xs:string">
+        <xs:attribute name="url" type="xs:anyURI"/>
+      </xs:extension>
+    </xs:simpleContent>
+  </xs:complexType>
+  <xs:complexType name="Enclosure">
+    <xs:simpleContent>
+      <xs:extension base="xs:string">
+        <xs:attribute name="url" type="xs:anyURI" use="required">
+          <xs:annotation>
+            <xs:documentation>URL where the enclosure is located</xs:documentation>
+          </xs:annotation>
+        </xs:attribute>
+        <xs:attribute name="length" type="xs:nonNegativeInteger" use="required">
+          <xs:annotation>
+            <xs:documentation>Size in bytes</xs:documentation>
+          </xs:annotation>
+        </xs:attribute>
+        <xs:attribute name="type" type="xs:string" use="required">
+          <xs:annotation>
+            <xs:documentation>MIME media-type of the enclosure</xs:documentation>
+          </xs:annotation>
+        </xs:attribute>
+      </xs:extension>
+    </xs:simpleContent>
+  </xs:complexType>
+  <xs:complexType name="Guid">
+    <xs:simpleContent>
+      <xs:extension base="xs:string">
+        <xs:attribute name="isPermaLink" type="xs:boolean" use="optional" default="true"/>
+      </xs:extension>
+    </xs:simpleContent>
+  </xs:complexType>
+
+<!--
+TODO:
+- Need to add regexp pattern for MIME media-type value of tEnclosure/type
+- Need to add regexp pattern for checking that the contents of guid is a URL when isPermaLink="true"
+- Need to add some form of constraint to check on an item that one, or other, or both of title and description are present.
+  However, I'm not sure it is possible to represent these constraints in XML Schema language alone.
+- Need some way to enforce cardinality constraints preventing repeated elements in channels or items
+- Unfortunately the bug-fix for issue 10231 made this schema non-deterministic with respect to extensibility elements.
+  We can't tell whether an extension element in tRssChannel is within the choice or after the item elements.
+  Need to reconsider the solution to bug-fix 10231.
+-->
+
+<!--
+Change Log:
+Date        Revision  Description
+31-Mar-2003   1       Initial version released for comment
+31-Mar-2003   2       Changes based on feedback from Gudge:
+                      - Remove targetNamespace="" and use elementFormDefault="unqualified" instead
+                      - Use namespace="##other" on <any>'s to create a more deterministic data model.
+                      - Added missing xs:documentation inside xs:annotation at the schema level.
+                      - Use xs:language for ISO Language Codes in <language> element.
+                      - Change guid to a single declaration.  This loses some of the checking of the 
+                        URL when the contents of the guid is a permaLink, so we will need to add 
+                        that back in with a regexp pattern.
+14-Apr-2003   3       Changes to solve some element ordering problems.
+                      - Use xs:all in place of xs:sequence to support flexible ordering of elements.
+                        Although the ordering constraints for elements is not clear from the 
+                        original specification, the custom and practice seems to be that 
+                        element ordering is freeform.
+                      - Use elementFormDefault="qualified" for explicit intent.
+15-Apr-2003   4       Changes to solve some element ordering problems.
+                      - Use xs:choice in place of xs:all as previous usage of <all> was invalid.
+                        This creates the problem that insufficient constraints can be applied
+                        by the schema - for example, it can't prevent two title elements for an item.
+                      - Use elementFormDefault="unqualified" to get the correct behaviour
+                        when importing and combining schemas.
+15-Apr-2003   5       Putting the extensibility element inside the repeating choice solves 
+                        all problems with element ordering.
+15-Apr-2003   6       - skipHours and skipDays should contain a nested list of values, 
+                        not just a single value.
+                      - Added version attribute to schema definition.
+                      - Corrected type of the cloud element
+25-Apr-2003   7       - Add regexp for RFC-822 date suggested by Sam Ruby
+                      - I had to leave the base type of the tRfc822FormatDate type 
+                        as xs:string due to the problems with using 
+                        a pattern with xs:dateTime described at
+                        http://www.thearchitect.co.uk/weblog/archives/2003/04/000142.html
+19-Jun-2003   8       - Fixed a bug the Oxygen XML Editor spotted in the regexp for RFC-822 dates
+23-Jun-2003   9       - Added legal boilerplate license text for LGPL.
+                      - Minor formatting changes.
+24-Jun-2003  10       - Missing types for item/title and item/description - Spotted by Andreas Schwotzer.
+01-Jan-2008  11       - Copy made available under the Microsoft Public License (MS-PL).
+25-May-2008  12       - Bug fix 10231 from Ken Gruven - channel can contain zero or more items.
+06-Sep-2008  13       - Fixed tab-space whitespace issues. Now always use spaces. 
+                      - Undid the fix for bug-fix 10231 since it made the schema non-deterministic 
+                        with respect to extensibility elements in tRssChannel - need to reconsider the fix.
+08-Sep-2008  14       - Removed 't' prefixes from type names to improve class names 
+                        that get code-generated from the schema. 
+22-Sep-2008  15       - Move type def for rss element in-line for improved compatibility with Java 1.6 tools.
+01-Nov-2008  16       - Added the missing rating element from the spec to RssChannel.
+-->
+
+</xs:schema>
diff --git a/tests/test_command_import_wordpress.py b/tests/test_command_import_wordpress.py
new file mode 100644
index 0000000..4a30dba
--- /dev/null
+++ b/tests/test_command_import_wordpress.py
@@ -0,0 +1,92 @@
+# -*- coding: utf-8 -*-
+from __future__ import unicode_literals
+
+from context import nikola
+import os
+import unittest
+import mock
+
+
+class CommandImportWordpressTest(unittest.TestCase):
+    def setUp(self):
+        # Fresh command instance plus the absolute path of the export fixture beside this file.
+        self.import_command = nikola.plugins.command_import_wordpress.CommandImportWordpress()
+        fixture = os.path.join(os.path.dirname(__file__), 'wordpress_export_example.xml')
+        self.import_filename = os.path.abspath(fixture)
+
+    def tearDown(self):
+        # Discard the attributes that setUp created on this test instance.
+        del self.import_command, self.import_filename
+
+    def test_create_import_work_without_argument(self):
+        # Smoke test: calling run() without an export file argument must not raise.
+        # The command is expected to show its usage instead (not asserted here).
+        self.import_command.run()
+
+    def test_create_import(self):
+        # Swap four methods of the command class for mocks, then run the import.
+        target = 'nikola.plugins.command_import_wordpress.CommandImportWordpress.'
+        data_import, site_generation = mock.MagicMock(), mock.MagicMock()
+        write_urlmap, write_configuration = mock.MagicMock(), mock.MagicMock()
+
+        with mock.patch(target + 'generate_base_site', site_generation):
+            with mock.patch(target + 'import_posts', data_import):
+                with mock.patch(target + 'write_urlmap_csv', write_urlmap):
+                    with mock.patch(target + 'write_configuration', write_configuration):
+                        self.import_command.run(self.import_filename)
+
+        self.assertTrue(site_generation.called)
+        self.assertTrue(data_import.called)
+
+    def test_populate_context(self):
+        channel = self.import_command.get_channel_from_file(self.import_filename)
+        context = self.import_command.populate_context(channel)
+
+        # These keys only have to be present; their values are not checked here.
+        self.assertTrue('POST_PAGES' in context)
+        self.assertTrue('POST_COMPILERS' in context)
+
+        self.assertEqual('de', context['DEFAULT_LANG'])
+        self.assertEqual('Wordpress blog title', context['BLOG_TITLE'])
+        self.assertEqual('Nikola test blog ;) - with moré Ümläüts', context['BLOG_DESCRIPTION'])
+        self.assertEqual('http://some.blog', context['BLOG_URL'])
+        self.assertEqual('mail@some.blog', context['BLOG_EMAIL'])
+        self.assertEqual('Niko', context['BLOG_AUTHOR'])
+
+    def test_importing_posts_and_attachments(self):
+        channel = self.import_command.get_channel_from_file(
+            self.import_filename)
+        self.import_command.context = self.import_command.populate_context(
+            channel)
+        self.import_command.url_map = {}  # For testing we use an empty one.
+        # Mocks substituted below for write_metadata, write_content and download_url_content_to_file.
+        write_metadata = mock.MagicMock()
+        write_content = mock.MagicMock()
+        download_mock = mock.MagicMock()
+        # os.makedirs is patched as well, so no directories are created through it during the import.
+        with mock.patch('nikola.plugins.command_import_wordpress.CommandImportWordpress.write_content', write_content):
+            with mock.patch('nikola.plugins.command_import_wordpress.CommandImportWordpress.write_metadata', write_metadata):
+                with mock.patch('nikola.plugins.command_import_wordpress.CommandImportWordpress.download_url_content_to_file', download_mock):
+                    with mock.patch('nikola.plugins.command_import_wordpress.os.makedirs'):
+                        self.import_command.import_posts(channel)
+        # The attachment URL must be downloaded to the matching path below new_site/files.
+        self.assertTrue(download_mock.called)
+        download_mock.assert_any_call(u'http://some.blog/wp-content/uploads/2008/07/arzt_und_pfusch-sick-cover.png', u'new_site/files/wp-content/uploads/2008/07/arzt_und_pfusch-sick-cover.png')
+        # Metadata must be written for the 'Kontakt' item under new_site/stories.
+        self.assertTrue(write_metadata.called)
+        write_metadata.assert_any_call(u'new_site/stories/kontakt.meta', 'Kontakt', u'kontakt', '2009-07-16 20:20:32', None, [])
+        # NOTE(review): expected bodies have '\n\n' where wordpress_export_example.xml (presumably the input) has one newline.
+        self.assertTrue(write_content.called)
+        write_content.assert_any_call(u'new_site/posts/200704hoert.wp', '...!\n\n\n\n[caption id="attachment_16" align="alignnone" width="739" caption="caption test"]<img class="size-full wp-image-16" title="caption test" src="http://some.blog/wp-content/uploads/2009/07/caption_test.jpg" alt="caption test" width="739" height="517" />[/caption]\n\n\n\nNicht, dass daran jemals Zweifel bestanden.')
+        write_content.assert_any_call(u'new_site/posts/200807arzt-und-pfusch-s-i-c-k.wp', u'<img class="size-full wp-image-10 alignright" title="Arzt+Pfusch - S.I.C.K." src="http://some.blog/wp-content/uploads/2008/07/arzt_und_pfusch-sick-cover.png" alt="Arzt+Pfusch - S.I.C.K." width="210" height="209" />Arzt+Pfusch - S.I.C.K.Gerade bin ich \xfcber das Album <em>S.I.C.K</em> von <a title="Arzt+Pfusch" href="http://www.arztpfusch.com/" target="_blank">Arzt+Pfusch</a> gestolpert, welches Arzt+Pfusch zum Download f\xfcr lau anbieten. Das Album steht unter einer Creative Commons <a href="http://creativecommons.org/licenses/by-nc-nd/3.0/de/">BY-NC-ND</a>-Lizenz.\n\nDie Ladung <em>noisebmstupidevildustrial</em> gibts als MP3s mit <a href="http://www.archive.org/download/dmp005/dmp005_64kb_mp3.zip">64kbps</a> und <a href="http://www.archive.org/download/dmp005/dmp005_vbr_mp3.zip">VBR</a>, als Ogg Vorbis und als FLAC (letztere <a href="http://www.archive.org/details/dmp005">hier</a>). <a href="http://www.archive.org/download/dmp005/dmp005-artwork.zip">Artwork</a> und <a href="http://www.archive.org/download/dmp005/dmp005-lyrics.txt">Lyrics</a> gibts nochmal einzeln zum Download.')
+        write_content.assert_any_call(u'new_site/stories/kontakt.wp', u'<h1>Datenschutz</h1>\n\nIch erhebe und speichere automatisch in meine Server Log Files Informationen, die dein Browser an mich \xfcbermittelt. Dies sind:\n\n<ul>\n\n    <li>Browsertyp und -version</li>\n\n    <li>verwendetes Betriebssystem</li>\n\n    <li>Referrer URL (die zuvor besuchte Seite)</li>\n\n    <li>IP Adresse des zugreifenden Rechners</li>\n\n    <li>Uhrzeit der Serveranfrage.</li>\n\n</ul>\n\nDiese Daten sind f\xfcr mich nicht bestimmten Personen zuordenbar. Eine Zusammenf\xfchrung dieser Daten mit anderen Datenquellen wird nicht vorgenommen, die Daten werden einzig zu statistischen Zwecken erhoben.')
+        # url_map (emptied above) must now map the old permalinks to the new .html URLs.
+        self.assertTrue(len(self.import_command.url_map) > 0)
+
+        self.assertEqual(self.import_command.url_map['http://some.blog/2007/04/hoert/'], u'http://some.blog/posts/200704hoert.html')
+        self.assertEqual(self.import_command.url_map['http://some.blog/2008/07/arzt-und-pfusch-s-i-c-k/'], u'http://some.blog/posts/200807arzt-und-pfusch-s-i-c-k.html')
+        self.assertEqual(self.import_command.url_map['http://some.blog/kontakt/'], u'http://some.blog/stories/kontakt.html')
+
+
+if __name__ == '__main__':  # run the tests when this file is executed directly
+    unittest.main()
diff --git a/tests/test_rss_feeds.py b/tests/test_rss_feeds.py
new file mode 100644
index 0000000..2b48f36
--- /dev/null
+++ b/tests/test_rss_feeds.py
@@ -0,0 +1,104 @@
+# -*- coding: utf-8 -*-
+
+import unittest
+import os
+import re
+from StringIO import StringIO
+
+import mock
+
+from context import nikola
+from lxml import etree
+
+
+class RSSFeedTest(unittest.TestCase):
+    def setUp(self):
+        self.blog_url = "http://some.blog"
+        # Render a one-post feed with get_meta, os.path.isdir and Post.text mocked out.
+        with mock.patch('nikola.nikola.utils.get_meta',
+                        mock.Mock(return_value=('post title',
+                                                'awesome_article',
+                                                '2012-10-01 22:41', 'tags',
+                                                'link', 'description'))):
+            with mock.patch('nikola.nikola.utils.os.path.isdir',
+                            mock.Mock(return_value=True)):
+                with mock.patch('nikola.nikola.Post.text',
+                                mock.Mock(return_value='some long text')):
+
+                    example_post = nikola.nikola.Post('source.file',
+                                                      'cache',
+                                                      'blog_folder',
+                                                      True,
+                                                      {'en': ''},
+                                                      'en',
+                                                      self.blog_url,
+                                                      'unused message.')
+                    # mock_open() yields a mock whose mock_calls records open() and every call on the handle.
+                    opener_mock = mock.mock_open()
+                    # create=True lets the patch add 'open' even if utils has no such attribute of its own.
+                    with mock.patch('nikola.nikola.utils.open', opener_mock, create=True):
+                        nikola.nikola.utils.generic_rss_renderer('en',
+                                                                 "blog_title",
+                                                                 self.blog_url,
+                                                                 "blog_description",
+                                                                 [example_post,
+                                                                  ],
+                                                                 'testfeed.rss')
+                    # Join each call's first argument; [2:-1] presumably skips open()/__enter__() and the final __exit__().
+                    self.file_content = ''.join(
+                        [call[1][0] for call in opener_mock.mock_calls[2:-1]])
+
+    def tearDown(self):
+        pass  # no per-test cleanup is performed
+
+    def test_feed_items_have_valid_URLs(self):
+        '''The items in the feed need to have valid urls in link and guid.'''
+        # This validation regex is taken from django.core.validators
+        url_validation_regex = re.compile(r'^(?:http|ftp)s?://'  # scheme: http(s):// or ftp(s)://
+                                          r'(?:(?:[A-Z0-9](?:[A-Z0-9-]{0,61}[A-Z0-9])?\.)+(?:[A-Z]{2,6}\.?|[A-Z0-9-]{2,}\.?)|'  # domain...
+                                          r'localhost|'  # localhost...
+                                          r'\d{1,3}\.\d{1,3}\.\d{1,3}\.\d{1,3}|'  # ...or ipv4
+                                          r'\[?[A-F0-9]*:[A-F0-9:]+\]?)'  # ...or ipv6
+                                          r'(?::\d+)?'  # optional port
+                                          r'(?:/?|[/?]\S+)$', re.IGNORECASE)
+
+        def is_valid_URL(url):
+            return url_validation_regex.match(url) is not None
+        # Parse the captured feed text and take the first <item> of the channel.
+        et = etree.parse(StringIO(self.file_content))
+        channel = et.find('channel')
+        item = channel.find('item')
+        guid = item.find('guid')
+        link = item.find('link')
+
+        # As stated by W3 FEED Validator: "link must be a full and valid URL"
+        self.assertTrue(is_valid_URL(link.text),
+                        'The following URL is not valid: %s' % link.text)
+        self.assertTrue(self.blog_url in link.text)
+
+        # "guid must be a full URL, unless isPermaLink attribute
+        # is false: /weblog/posts/the-minimal-server.html "
+        self.assertTrue(is_valid_URL(guid.text),
+                        'The following URL is not valid: %s' %
+                        guid.text)
+        self.assertTrue(self.blog_url in guid.text)
+
+    def test_feed_is_valid(self):
+        '''
+        Check the generated feed against the RSS 2.0 schema in rss-2_0.xsd.
+
+        Feeds can additionally be checked by hand with the W3 FEED
+        Validator that can be found at http://feedvalidator.org
+        '''
+        rss_schema_filename = os.path.join(os.path.dirname(__file__),
+                                           'rss-2_0.xsd')
+        with open(rss_schema_filename, 'r') as rss_schema_file:
+            xmlschema_doc = etree.parse(rss_schema_file)
+
+        xmlschema = etree.XMLSchema(xmlschema_doc)
+        document = etree.parse(StringIO(self.file_content))
+        # On failure, report the validator's error log instead of a bare "False is not true".
+        self.assertTrue(xmlschema.validate(document), xmlschema.error_log)
+
+if __name__ == '__main__':  # run the tests when this file is executed directly
+    unittest.main()
diff --git a/tests/wordpress_export_example.xml b/tests/wordpress_export_example.xml
new file mode 100644
index 0000000..7517193
--- /dev/null
+++ b/tests/wordpress_export_example.xml
@@ -0,0 +1,174 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!-- This is a WordPress eXtended RSS file generated by WordPress as an export of your site. -->
+<rss version="2.0"
+    xmlns:excerpt="http://wordpress.org/export/1.2/excerpt/"
+    xmlns:content="http://purl.org/rss/1.0/modules/content/"
+    xmlns:wfw="http://wellformedweb.org/CommentAPI/"
+    xmlns:dc="http://purl.org/dc/elements/1.1/"
+    xmlns:wp="http://wordpress.org/export/1.2/"
+>
+
+<channel>
+    <title>Wordpress blog title</title>
+    <link>http://some.blog</link>
+    <description>Nikola test blog ;) - with moré Ümläüts</description>
+    <pubDate>Wed, 25 Jul 2012 22:31:24 +0000</pubDate>
+    <language>de-DE</language>
+    <wp:wxr_version>1.2</wp:wxr_version>
+    <wp:base_site_url>http://some.blog</wp:base_site_url>
+    <wp:base_blog_url>http://some.blog</wp:base_blog_url>
+
+    <wp:author><wp:author_id>2</wp:author_id><wp:author_login>Niko</wp:author_login><wp:author_email>mail@some.blog</wp:author_email><wp:author_display_name><![CDATA[Niko]]></wp:author_display_name><wp:author_first_name><![CDATA[Niko]]></wp:author_first_name><wp:author_last_name><![CDATA[]]></wp:author_last_name></wp:author>
+
+    <wp:category><wp:term_id>11</wp:term_id><wp:category_nicename>programmierung</wp:category_nicename><wp:category_parent></wp:category_parent><wp:cat_name><![CDATA[c0ding]]></wp:cat_name></wp:category>
+    <wp:tag><wp:term_id>501</wp:term_id><wp:tag_slug>dotnet</wp:tag_slug><wp:tag_name><![CDATA[.Net]]></wp:tag_name></wp:tag>
+
+    <generator>http://wordpress.org/?v=3.4.1</generator>
+
+    <item>
+        <title>Arzt+Pfusch - S.I.C.K.</title>
+        <link>http://some.blog/2008/07/arzt-und-pfusch-s-i-c-k/arzt_und_pfusch-sick-cover/</link>
+        <pubDate>Thu, 16 Jul 2009 19:40:37 +0000</pubDate>
+        <dc:creator>Niko</dc:creator>
+        <guid isPermaLink="false">http://some.blog/wp-content/uploads/2008/07/arzt_und_pfusch-sick-cover.png</guid>
+        <description></description>
+        <content:encoded><![CDATA[Das Cover von Arzt+Pfusch - S.I.C.K.]]></content:encoded>
+        <excerpt:encoded><![CDATA[Arzt+Pfusch - S.I.C.K.]]></excerpt:encoded>
+        <wp:post_id>10</wp:post_id>
+        <wp:post_date>2009-07-16 21:40:37</wp:post_date>
+        <wp:post_date_gmt>2009-07-16 19:40:37</wp:post_date_gmt>
+        <wp:comment_status>open</wp:comment_status>
+        <wp:ping_status>open</wp:ping_status>
+        <wp:post_name>arzt_und_pfusch-sick-cover</wp:post_name>
+        <wp:status>inherit</wp:status>
+        <wp:post_parent>6</wp:post_parent>
+        <wp:menu_order>0</wp:menu_order>
+        <wp:post_type>attachment</wp:post_type>
+        <wp:post_password></wp:post_password>
+        <wp:is_sticky>0</wp:is_sticky>
+        <wp:attachment_url>http://some.blog/wp-content/uploads/2008/07/arzt_und_pfusch-sick-cover.png</wp:attachment_url>
+        <wp:postmeta>
+            <wp:meta_key>_wp_attached_file</wp:meta_key>
+            <wp:meta_value><![CDATA[2008/07/arzt_und_pfusch-sick-cover.png]]></wp:meta_value>
+        </wp:postmeta>
+        <wp:postmeta>
+            <wp:meta_key>_wp_attachment_metadata</wp:meta_key>
+            <wp:meta_value><![CDATA[a:6:{s:5:"width";s:3:"300";s:6:"height";s:3:"299";s:14:"hwstring_small";s:22:"height='96' width='96'";s:4:"file";s:38:"2008/07/arzt_und_pfusch-sick-cover.png";s:5:"sizes";a:1:{s:9:"thumbnail";a:3:{s:4:"file";s:38:"arzt_und_pfusch-sick-cover-150x150.png";s:5:"width";s:3:"150";s:6:"height";s:3:"150";}}s:10:"image_meta";a:10:{s:8:"aperture";s:1:"0";s:6:"credit";s:0:"";s:6:"camera";s:0:"";s:7:"caption";s:0:"";s:17:"created_timestamp";s:1:"0";s:9:"copyright";s:0:"";s:12:"focal_length";s:1:"0";s:3:"iso";s:1:"0";s:13:"shutter_speed";s:1:"0";s:5:"title";s:0:"";}}]]></wp:meta_value>
+        </wp:postmeta>
+    </item>
+
+    <item>
+        <title>Caption test</title>
+        <link>http://some.blog/2007/04/hoert/</link>
+        <pubDate>Fri, 27 Apr 2007 13:02:35 +0000</pubDate>
+        <dc:creator>Niko</dc:creator>
+        <guid isPermaLink="false">http://some.blog/?p=17</guid>
+        <description></description>
+        <content:encoded><![CDATA[...!
+
+[caption id="attachment_16" align="alignnone" width="739" caption="caption test"]<img class="size-full wp-image-16" title="caption test" src="http://some.blog/wp-content/uploads/2009/07/caption_test.jpg" alt="caption test" width="739" height="517" />[/caption]
+
+Nicht, dass daran jemals Zweifel bestanden.]]></content:encoded>
+        <excerpt:encoded><![CDATA[]]></excerpt:encoded>
+        <wp:post_id>17</wp:post_id>
+        <wp:post_date>2007-04-27 15:02:35</wp:post_date>
+        <wp:post_date_gmt>2007-04-27 13:02:35</wp:post_date_gmt>
+        <wp:comment_status>open</wp:comment_status>
+        <wp:ping_status>open</wp:ping_status>
+        <wp:post_name>hoert</wp:post_name>
+        <wp:status>publish</wp:status>
+        <wp:post_parent>0</wp:post_parent>
+        <wp:menu_order>0</wp:menu_order>
+        <wp:post_type>post</wp:post_type>
+        <wp:post_password></wp:post_password>
+        <wp:is_sticky>0</wp:is_sticky>
+        <category domain="post_tag" nicename="bild"><![CDATA[Bild]]></category>
+        <category domain="category" nicename="musik"><![CDATA[Musik]]></category>
+        <category domain="category" nicename="unterhaltung"><![CDATA[Unterhaltung]]></category>
+        <category domain="post_tag" nicename="werbung"><![CDATA[Werbung]]></category>
+        <wp:postmeta>
+            <wp:meta_key>_edit_last</wp:meta_key>
+            <wp:meta_value><![CDATA[2]]></wp:meta_value>
+        </wp:postmeta>
+    </item>
+
+    <item>
+        <title>Arzt+Pfusch - S.I.C.K.</title>
+        <link>http://some.blog/2008/07/arzt-und-pfusch-s-i-c-k/</link>
+        <pubDate>Sat, 12 Jul 2008 19:22:06 +0000</pubDate>
+        <dc:creator>Niko</dc:creator>
+        <guid isPermaLink="false">http://some.blog/?p=6</guid>
+        <description></description>
+        <content:encoded><![CDATA[<img class="size-full wp-image-10 alignright" title="Arzt+Pfusch - S.I.C.K." src="http://some.blog/wp-content/uploads/2008/07/arzt_und_pfusch-sick-cover.png" alt="Arzt+Pfusch - S.I.C.K." width="210" height="209" />Arzt+Pfusch - S.I.C.K.Gerade bin ich über das Album <em>S.I.C.K</em> von <a title="Arzt+Pfusch" href="http://www.arztpfusch.com/" target="_blank">Arzt+Pfusch</a> gestolpert, welches Arzt+Pfusch zum Download für lau anbieten. Das Album steht unter einer Creative Commons <a href="http://creativecommons.org/licenses/by-nc-nd/3.0/de/">BY-NC-ND</a>-Lizenz.
+Die Ladung <em>noisebmstupidevildustrial</em> gibts als MP3s mit <a href="http://www.archive.org/download/dmp005/dmp005_64kb_mp3.zip">64kbps</a> und <a href="http://www.archive.org/download/dmp005/dmp005_vbr_mp3.zip">VBR</a>, als Ogg Vorbis und als FLAC (letztere <a href="http://www.archive.org/details/dmp005">hier</a>). <a href="http://www.archive.org/download/dmp005/dmp005-artwork.zip">Artwork</a> und <a href="http://www.archive.org/download/dmp005/dmp005-lyrics.txt">Lyrics</a> gibts nochmal einzeln zum Download.]]></content:encoded>
+        <excerpt:encoded><![CDATA[]]></excerpt:encoded>
+        <wp:post_id>6</wp:post_id>
+        <wp:post_date>2008-07-12 21:22:06</wp:post_date>
+        <wp:post_date_gmt>2008-07-12 19:22:06</wp:post_date_gmt>
+        <wp:comment_status>open</wp:comment_status>
+        <wp:ping_status>open</wp:ping_status>
+        <wp:post_name>arzt-und-pfusch-s-i-c-k</wp:post_name>
+        <wp:status>publish</wp:status>
+        <wp:post_parent>0</wp:post_parent>
+        <wp:menu_order>0</wp:menu_order>
+        <wp:post_type>post</wp:post_type>
+        <wp:post_password></wp:post_password>
+        <wp:is_sticky>0</wp:is_sticky>
+        <category domain="post_tag" nicename="arzt-und-pfusch"><![CDATA[Arzt+Pfusch]]></category>
+        <category domain="post_tag" nicename="creative-commons"><![CDATA[Creative Commons]]></category>
+        <category domain="post_tag" nicename="download"><![CDATA[Download]]></category>
+        <category domain="post_tag" nicename="electronic-body-music"><![CDATA[EBM]]></category>
+        <category domain="post_tag" nicename="flac"><![CDATA[Free Lossless Audio Codec]]></category>
+        <category domain="post_tag" nicename="gratis"><![CDATA[Gratis]]></category>
+        <category domain="post_tag" nicename="industrial"><![CDATA[Industrial]]></category>
+        <category domain="post_tag" nicename="mp3"><![CDATA[MP3]]></category>
+        <category domain="category" nicename="musik"><![CDATA[Musik]]></category>
+        <category domain="post_tag" nicename="ogg"><![CDATA[Ogg]]></category>
+        <wp:postmeta>
+            <wp:meta_key>_edit_last</wp:meta_key>
+            <wp:meta_value><![CDATA[2]]></wp:meta_value>
+        </wp:postmeta>
+    </item>
+
+        <item>
+        <title>Kontakt</title>
+        <link>http://some.blog/kontakt/</link>
+        <pubDate>Thu, 16 Jul 2009 18:20:32 +0000</pubDate>
+        <dc:creator>Niko</dc:creator>
+        <guid isPermaLink="false">http://some.blog/?page_id=3</guid>
+        <description></description>
+        <content:encoded><![CDATA[<h1>Datenschutz</h1>
+Ich erhebe und speichere automatisch in meine Server Log Files Informationen, die dein Browser an mich übermittelt. Dies sind:
+<ul>
+    <li>Browsertyp und -version</li>
+    <li>verwendetes Betriebssystem</li>
+    <li>Referrer URL (die zuvor besuchte Seite)</li>
+    <li>IP Adresse des zugreifenden Rechners</li>
+    <li>Uhrzeit der Serveranfrage.</li>
+</ul>
+Diese Daten sind für mich nicht bestimmten Personen zuordenbar. Eine Zusammenführung dieser Daten mit anderen Datenquellen wird nicht vorgenommen, die Daten werden einzig zu statistischen Zwecken erhoben.]]></content:encoded>
+        <excerpt:encoded><![CDATA[]]></excerpt:encoded>
+        <wp:post_id>3</wp:post_id>
+        <wp:post_date>2009-07-16 20:20:32</wp:post_date>
+        <wp:post_date_gmt>2009-07-16 18:20:32</wp:post_date_gmt>
+        <wp:comment_status>closed</wp:comment_status>
+        <wp:ping_status>closed</wp:ping_status>
+        <wp:post_name>kontakt</wp:post_name>
+        <wp:status>publish</wp:status>
+        <wp:post_parent>0</wp:post_parent>
+        <wp:menu_order>0</wp:menu_order>
+        <wp:post_type>page</wp:post_type>
+        <wp:post_password></wp:post_password>
+        <wp:is_sticky>0</wp:is_sticky>
+        <wp:postmeta>
+            <wp:meta_key>_edit_last</wp:meta_key>
+            <wp:meta_value><![CDATA[2]]></wp:meta_value>
+        </wp:postmeta>
+        <wp:postmeta>
+            <wp:meta_key>_wp_page_template</wp:meta_key>
+            <wp:meta_value><![CDATA[default]]></wp:meta_value>
+        </wp:postmeta>
+    </item>
+
+</channel>
+</rss>
diff --git a/tests/wordpress_unicode_export.xml b/tests/wordpress_unicode_export.xml
new file mode 100644
index 0000000..b2204fc
--- /dev/null
+++ b/tests/wordpress_unicode_export.xml
@@ -0,0 +1,114 @@
+<?xml version="1.0" encoding="UTF-8" ?>
+<!-- This is a WordPress eXtended RSS file generated by WordPress as an export of your site. -->
+<!-- It contains information about your site's posts, pages, comments, categories, and other content. -->
+<!-- You may use this file to transfer that content from one site to another. -->
+<!-- This file is not intended to serve as a complete backup of your site. -->
+
+<!-- To import this information into a WordPress site follow these steps: -->
+<!-- 1. Log in to that site as an administrator. -->
+<!-- 2. Go to Tools: Import in the WordPress admin panel. -->
+<!-- 3. Install the "WordPress" importer from the list. -->
+<!-- 4. Activate & Run Importer. -->
+<!-- 5. Upload this file using the form provided on that page. -->
+<!-- 6. You will first be asked to map the authors in this export file to users -->
+<!--    on the site. For each author, you may choose to map to an -->
+<!--    existing user on the site or to create a new user. -->
+<!-- 7. WordPress will then import each of the posts, pages, comments, categories, etc. -->
+<!--    contained in this file into your site. -->
+
+<!-- generator="WordPress.com" created="2012-12-25 21:39"-->
+<rss version="2.0"
+	xmlns:excerpt="http://wordpress.org/export/1.2/excerpt/"
+	xmlns:content="http://purl.org/rss/1.0/modules/content/"
+	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
+	xmlns:dc="http://purl.org/dc/elements/1.1/"
+	xmlns:wp="http://wordpress.org/export/1.2/"
+>
+
+<channel>
+	<title>Nikola Unicode Test Íµpó®t</title>
+	<link>http://nikolaunicode.wordpress.com</link>
+	<description>The greatest WordPress.com site in all the land!</description>
+	<pubDate>Tue, 25 Dec 2012 21:39:30 +0000</pubDate>
+	<language>en</language>
+	<wp:wxr_version>1.2</wp:wxr_version>
+	<wp:base_site_url>http://wordpress.com/</wp:base_site_url>
+	<wp:base_blog_url>http://nikolaunicode.wordpress.com</wp:base_blog_url>
+
+	<wp:author><wp:author_id>3804924</wp:author_id><wp:author_login>ralsina</wp:author_login><wp:author_email>roberto.alsina@gmail.com</wp:author_email><wp:author_display_name><![CDATA[ralsina]]></wp:author_display_name><wp:author_first_name><![CDATA[]]></wp:author_first_name><wp:author_last_name><![CDATA[]]></wp:author_last_name></wp:author>
+
+	<wp:category><wp:term_id>1</wp:term_id><wp:category_nicename>uncategorized</wp:category_nicename><wp:category_parent></wp:category_parent><wp:cat_name><![CDATA[Uncategorized]]></wp:cat_name></wp:category>
+	<wp:tag><wp:term_id>132937998</wp:term_id><wp:tag_slug>thag1</wp:tag_slug><wp:tag_name><![CDATA[þág1]]></wp:tag_name></wp:tag>
+	<wp:tag><wp:term_id>132937999</wp:term_id><wp:tag_slug>thag%c2%b2</wp:tag_slug><wp:tag_name><![CDATA[þág²]]></wp:tag_name></wp:tag>
+
+	<generator>http://wordpress.com/</generator>
+<cloud domain='nikolaunicode.wordpress.com' port='80' path='/?rsscloud=notify' registerProcedure='' protocol='http-post' />
+<image>
+		<url>https://s2.wp.com/i/buttonw-com.png</url>
+		<title>Nikola Unicode Test Íµpó®t</title>
+		<link>http://nikolaunicode.wordpress.com</link>
+	</image>
+	<atom:link rel="search" type="application/opensearchdescription+xml" href="http://nikolaunicode.wordpress.com/osd.xml" title="Nikola Unicode Test Íµpó®t" />
+	<atom:link rel='hub' href='http://nikolaunicode.wordpress.com/?pushpress=hub'/>
+
+	<item>
+		<title>About</title>
+		<link>http://nikolaunicode.wordpress.com/about/</link>
+		<pubDate>Tue, 25 Dec 2012 21:36:15 +0000</pubDate>
+		<dc:creator>ralsina</dc:creator>
+		<guid isPermaLink="false">http://nikolaunicode.wordpress.com/?page_id=1</guid>
+		<description></description>
+		<content:encoded><![CDATA[This is an example of a page. Unlike posts, which are displayed on your blog’s front page in the order they’re published, pages are better suited for more timeless content that you want to be easily accessible, like your About or Contact information. Click the Edit link to make changes to this page or <a title="Direct link to Add New in the Admin Dashboard" href="/wp-admin/post-new.php?post_type=page">add another page</a>.]]></content:encoded>
+		<excerpt:encoded><![CDATA[]]></excerpt:encoded>
+		<wp:post_id>1</wp:post_id>
+		<wp:post_date>2012-12-25 21:36:15</wp:post_date>
+		<wp:post_date_gmt>2012-12-25 21:36:15</wp:post_date_gmt>
+		<wp:comment_status>open</wp:comment_status>
+		<wp:ping_status>open</wp:ping_status>
+		<wp:post_name>about</wp:post_name>
+		<wp:status>publish</wp:status>
+		<wp:post_parent>0</wp:post_parent>
+		<wp:menu_order>0</wp:menu_order>
+		<wp:post_type>page</wp:post_type>
+		<wp:post_password></wp:post_password>
+		<wp:is_sticky>0</wp:is_sticky>
+	</item>
+	<item>
+		<title>Úñî©òðé title</title>
+		<link>http://nikolaunicode.wordpress.com/2012/12/25/uniode-title/</link>
+		<pubDate>Tue, 25 Dec 2012 21:38:37 +0000</pubDate>
+		<dc:creator>ralsina</dc:creator>
+		<guid isPermaLink="false">http://nikolaunicode.wordpress.com/?p=3</guid>
+		<description></description>
+		<content:encoded><![CDATA[Mó®é úñí©óðé]]></content:encoded>
+		<excerpt:encoded><![CDATA[]]></excerpt:encoded>
+		<wp:post_id>3</wp:post_id>
+		<wp:post_date>2012-12-25 21:38:37</wp:post_date>
+		<wp:post_date_gmt>2012-12-25 21:38:37</wp:post_date_gmt>
+		<wp:comment_status>open</wp:comment_status>
+		<wp:ping_status>open</wp:ping_status>
+		<wp:post_name>uniode-title</wp:post_name>
+		<wp:status>publish</wp:status>
+		<wp:post_parent>0</wp:post_parent>
+		<wp:menu_order>0</wp:menu_order>
+		<wp:post_type>post</wp:post_type>
+		<wp:post_password></wp:post_password>
+		<wp:is_sticky>0</wp:is_sticky>
+		<category domain="post_tag" nicename="thag1"><![CDATA[þág1]]></category>
+		<category domain="post_tag" nicename="thag%c2%b2"><![CDATA[þág²]]></category>
+		<category domain="category" nicename="uncategorized"><![CDATA[Uncategorized]]></category>
+		<wp:postmeta>
+			<wp:meta_key>_edit_last</wp:meta_key>
+			<wp:meta_value><![CDATA[3804924]]></wp:meta_value>
+		</wp:postmeta>
+		<wp:postmeta>
+			<wp:meta_key>_publicize_pending</wp:meta_key>
+			<wp:meta_value><![CDATA[1]]></wp:meta_value>
+		</wp:postmeta>
+		<wp:postmeta>
+			<wp:meta_key>jabber_published</wp:meta_key>
+			<wp:meta_value><![CDATA[1356471518]]></wp:meta_value>
+		</wp:postmeta>
+	</item>
+</channel>
+</rss>
-- 
cgit v1.2.3