<!-- Root of a MediaWiki XML export: declares the export-0.3 namespace, -->
<!-- a schema location hint, the format version and the content language. -->
<mediawiki xmlns="http://www.mediawiki.org/xml/export-0.3/"
           xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
           xsi:schemaLocation="http://www.mediawiki.org/xml/export-0.3/ http://www.mediawiki.org/xml/export-0.3.xsd"
           version="0.3"
           xml:lang="en">
<!-- Optional global configuration info -->

<!-- Site name, as set in $wgSitename -->
<sitename>DemoWiki</sitename>

<!-- URL of the source wiki's main page, in case you forgot where this set came from -->
<base>http://example.com/wiki/Main_Page</base>

<!-- Source software version -->
<generator>MediaWiki 1.5.0</generator>

<!-- Title case sensitivity options of the wiki this data came from -->
<!-- May be 'first-letter', 'case-sensitive', or 'case-insensitive' -->
<case>first-letter</case>
<!-- Defined namespace keys on the source wiki. -->
<!-- A title's namespace prefix (the text before the first ':') can be -->
<!-- matched against these names to obtain the numeric key. -->
<!-- Key 0 has an empty name: titles in it carry no prefix. -->
<namespace key="-2">Media</namespace>
<namespace key="-1">Special</namespace>
<namespace key="0"></namespace>
<namespace key="1">Talk</namespace>
<namespace key="2">User</namespace>
<namespace key="3">User talk</namespace>
<namespace key="4">DemoWiki</namespace>
<namespace key="5">DemoWiki talk</namespace>
<namespace key="6">Image</namespace>
<namespace key="7">Image talk</namespace>
<namespace key="8">MediaWiki</namespace>
<namespace key="9">MediaWiki talk</namespace>
<namespace key="10">Template</namespace>
<namespace key="11">Template talk</namespace>
<namespace key="12">Help</namespace>
<namespace key="13">Help talk</namespace>
<namespace key="14">Category</namespace>
<namespace key="15">Category talk</namespace>
<!-- The rest of the data will be a series of page records -->

<!-- Titles are listed here in text form, with namespace prefix -->
<!-- if any, and spaces rather than the underscores used in URLs. -->
<title>Page title</title>

<!-- The page's immutable page_id number in the source database. -->
<!-- Page ID numbers are kept across page moves, but may change -->
<!-- if a page is deleted and recreated. -->
<!-- NOTE(review): no id element follows this description in the visible text; -->
<!-- confirm against the original export before relying on this record. -->

<!-- If restricted, the ACL is listed here raw. -->
<restrictions>edit=sysop:move=sysop</restrictions>
<!-- With a series of revision records... -->

<!-- Remember this is XML; if you must use a regex-based extractor -->
<!-- in place of a standard XML parser, be very careful. -->
<!-- * Don't forget to decode character entities! -->
<!-- * If using a 'loose' XML parser, ensure that whitespace is -->
<!-- preserved in the <text> elements. -->

<!-- Unique revision ID number (rev_id) in the source database. -->
<!-- This number uniquely identifies the revision on that wiki. -->
<!-- NOTE(review): no id element follows this description in the visible text; -->
<!-- confirm against the original export. -->

<!-- Revision timestamp in ISO 8601 form, UTC ('Z' suffix). -->
<timestamp>2001-01-15T13:15:00Z</timestamp>
<!-- This contributor is recorded as a username plus a numeric id. -->
<contributor>
  <username>Foobar</username>
  <id>42</id>
</contributor>
<comment>I have just one thing to say!</comment>
<!-- xml:space="preserve": whitespace inside the element is data, so the -->
<!-- content must stay on one line with its tags. -->
<text xml:space="preserve">A bunch of [[text]] here.</text>
<!-- An earlier revision of the same page; this contributor is recorded by IP address only. -->
<timestamp>2001-01-15T13:10:27Z</timestamp>
<contributor>
  <ip>10.0.0.2</ip>
</contributor>
<comment>new!</comment>
<!-- Whitespace inside <text> is preserved, so keep content and tags on one line. -->
<text xml:space="preserve">An earlier [[revision]].</text>
<!-- Talk-namespace page: the title carries the "Talk:" prefix. -->
<title>Talk:Page title</title>
<timestamp>2001-01-15T14:03:00Z</timestamp>
<contributor>
  <ip>10.0.0.2</ip>
</contributor>
<comment>hey</comment>
<!-- Whitespace inside <text> is preserved, so keep content and tags on one line. -->
<text xml:space="preserve">WHYD YOU LOCK PAGE??!!! i was editing that jerk</text>
<!-- Image-namespace page: the title uses spaces, not underscores. -->
<title>Image:Some image.jpg</title>
<timestamp>2001-01-15T20:34:12Z</timestamp>
<contributor>
  <username>Foobar</username>
  <id>42</id>
</contributor>
<comment>My awesomeest image!</comment>
<!-- Whitespace inside <text> is preserved, so keep content and tags on one line. -->
<text xml:space="preserve">This is an awesome little imgae. I lurves it. {{PD}}</text>
<!-- These fields carry a timestamp, contributor and comment together with a -->
<!-- filename and a source URL for the file. -->
<!-- NOTE(review): the element enclosing these fields is not visible here; -->
<!-- presumably an upload record for the image page above. Confirm. -->
<timestamp>2001-01-15T20:34:12Z</timestamp>
<contributor>
  <username>Foobar</username>
  <id>42</id>
</contributor>
<comment>My awesomeest image!</comment>
<!-- The filename uses an underscore where the page title has a space. -->
<filename>Some_image.jpg</filename>
<src>http://upload.wikimedia.org/commons/2/22/Some_image.jpg</src>