aboutsummaryrefslogtreecommitdiffstats
path: root/python_hadoop/tests/files/small.xml
blob: 78b9ba2d2321a2fe57f06787fd093f3672cb24e4 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
<?xml version="1.0" encoding="UTF-8"?>
<!--
  Small TEI document titled "Dummy Example File", stored under tests/files.
  The appInfo block below identifies the producing tool as GROBID
  0.5.1-SNAPSHOT. The xsi:schemaLocation hint on the root element is an
  absolute filesystem path to Grobid.xsd rather than a URL.
  NOTE(review): consumers presumably compare parsed values against this exact
  content, so element text and attribute values should be treated as fixed
  data; confirm against the tests before editing any of them.
-->
<TEI xmlns="http://www.tei-c.org/ns/1.0" 
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" 
xsi:schemaLocation="http://www.tei-c.org/ns/1.0 /srv/grobid/grobid-0.5.1/grobid-home/schemas/xsd/Grobid.xsd"
 xmlns:xlink="http://www.w3.org/1999/xlink">
	<!-- Header: tool provenance, bibliographic description of the document, then keywords and abstract. -->
	<teiHeader xml:lang="en">
		<!-- Provenance: application ident, version and the "when" timestamp of the run. -->
		<encodingDesc>
			<appInfo>
				<application version="0.5.1-SNAPSHOT" ident="GROBID" when="2018-04-02T00:31+0000">
					<ref target="https://github.com/kermitt2/grobid">GROBID - A machine learning software for extracting information from scholarly documents</ref>
				</application>
			</appInfo>
		</encodingDesc>
		<!-- Description of the document itself: main title, publication statement (year 2000), and the source biblStruct. -->
		<fileDesc>
			<titleStmt>
				<title level="a" type="main">Dummy Example File</title>
			</titleStmt>
			<publicationStmt>
				<publisher/>
				<availability status="unknown"><licence/></availability>
				<date type="published" when="2000">2000</date>
			</publicationStmt>
			<sourceDesc>
				<biblStruct>
					<!-- Article-level data: three author entries followed by the main title (same text as in titleStmt). -->
					<analytic>
						<author>
							<persName xmlns="http://www.tei-c.org/ns/1.0"><forename type="first">Brewster</forename><surname>Kahle</surname></persName>
						</author>
						<author>
							<persName xmlns="http://www.tei-c.org/ns/1.0"><forename type="first">J</forename><surname>Doe</surname></persName>
						</author>
						<!-- This author entry holds only an affiliation (key "aff0") and no persName.
						     NOTE(review): presumably a deliberate edge case for authors without a name; confirm against the tests. -->
						<author>
							<affiliation key="aff0">
								<orgName type="institution">Internet Archive</orgName>
							</affiliation>
						</author>
						<title level="a" type="main">Dummy Example File</title>
					</analytic>
					<!-- Container-level data: the level="m" title is a single free-text string that also
					     contains a journal name, page range and ISSN; the imprint repeats the year 2000. -->
					<monogr>
						<title level="m">Dummy Example File. Journal of Fake News. pp. 1-2. ISSN 1234-5678</title>
						<imprint>
							<date type="published" when="2000">2000</date>
						</imprint>
					</monogr>
				</biblStruct>
			</sourceDesc>
		</fileDesc>
		<!-- Profile: one keyword term and a one-paragraph abstract. -->
		<profileDesc>
			<textClass>
				<keywords>
					<term>Fake Data</term>
				</keywords>
			</textClass>
			<abstract>
				<p>Everything you ever wanted to know about nothing</p>
			</abstract>
		</profileDesc>
	</teiHeader>
	<!-- Document text: body with four numbered sections, then the back matter with the reference list. -->
	<text xml:lang="en">
		<!-- Each div redeclares the default TEI namespace already set on the root element; for a
		     namespace-aware parser the redeclaration does not change the element names.
		     The paragraphs are mixed content, so the line break after each opening p tag is part of the text.
		     Section 1 holds the only citation (target "#b0"); section 2 has a head but no paragraph.
		     NOTE(review): "Potatos" in the head of section 2.2 looks like a typo for "Potatoes"; it is left
		     unchanged because tests may expect this exact string. Confirm before correcting. -->
		<body>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="1">Introduction</head><p>
Everything starts somewhere, as somebody<ref type="bibr" target="#b0">[1]</ref> once said.</p></div>

<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2">In Depth</head></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.1">Meat</head><p>
You know, for kids.</p></div>
<div xmlns="http://www.tei-c.org/ns/1.0"><head n="2.2">Potatos</head><p>
QED.</p></div>
		</body>
		<!-- Back matter: a references div whose listBibl holds two entries, b0 and b1. -->
		<back>
			<div type="references">

				<listBibl>

<!-- b0: the entry cited from the Introduction. It has one author whose only forename is typed "middle",
     a journal title, volume 20, pages 1 to 11, and a year-only date given as an empty element. -->
<biblStruct xml:id="b0">
	<analytic>
		<title level="a" type="main">Everything is Wonderful</title>
		<author>
			<persName xmlns="http://www.tei-c.org/ns/1.0"><forename type="middle">A</forename><surname>Seaperson</surname></persName>
		</author>
	</analytic>
	<monogr>
		<title level="j">Letters in the Alphabet</title>
		<imprint>
			<biblScope unit="volume">20</biblScope>
			<biblScope unit="page" from="1" to="11" />
			<date type="published" when="2001" />
		</imprint>
	</monogr>
</biblStruct>

<!-- b1: not referenced from the body above. It has no author and no page range, and its date is a full
     day (2011-03-28).
     NOTE(review): the note text "None" looks like a serialized null value rather than a real note;
     it is kept unchanged as data. Confirm whether the tests expect it. -->
<biblStruct xml:id="b1">
	<analytic>
		<title level="a" type="main">All about Facts</title>
	</analytic>
	<monogr>
		<title level="j">The Dictionary</title>
		<imprint>
			<biblScope unit="volume">14</biblScope>
			<date type="published" when="2011-03-28" />
		</imprint>
	</monogr>
	<note>None</note>
</biblStruct>

				</listBibl>
			</div>
		</back>
	</text>
</TEI>