The gta tool requires two sets of files: documents and annotations. When working on a tagtog project, files like this one and the corresponding annotation file are created, one of each for every document that is worked on.
The document files (HTML files) that contain the text to be displayed can have one of two different structures. The first accepted structure is shown below:
<!DOCTYPE html >
<html id="tagtogId-document_title.txt" data-origid="document_title.txt" class="anndoc" data-anndoc-version="3.6" lang="" xml:lang="" xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta charset="UTF-8"/>
<meta name="generator" content="net.tagtog.anndoc.v3.parsers.general.VerbatimParser_v1_0_1"/>
<title>tagtogId-document_title.txt</title>
</head>
<body>
<article>
<section data-type="">
<div class="content">
<pre id="s1v1">Document content</pre>
</div>
</section>
</article>
</body>
</html>
The second accepted structure is shown below:
<!DOCTYPE html >
<html id="tagtogId-document_title.txt" data-origid="document_title.txt" class="anndoc" data-anndoc-version="3.6" lang="" xml:lang="" xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta charset="UTF-8"/>
<meta name="generator" content="net.tagtog.anndoc.v3.parsers.general.VerbatimParser_v1_0_1"/>
<title>tagtogId-document_title.txt</title>
</head>
<body>
<article>
<section data-type="">
<div class="content">
<p id="s1p1">Paragraph content</p>
<p id="s1p2">Paragraph content</p>
<p id="s1p3">Paragraph content</p>
</div>
</section>
</article>
</body>
</html>
Finally, the annotation files must be in JSON format with the following structure:
{
"annotatable": {
"parts": ["s1v1"]
},
"anncomplete": true,
"sources": [],
"metas": {},
"entities": [
{
"classId": "e_4",
"part": "s1v1",
"offsets": [{
"start": 12,
"text": "toponymName"
}],
"coordinates": [],
"confidence": {
"state": "pre-added",
"who": ["user:tagtogUsername"],
"prob": 1
},
"fields": {
"f_23": {
"value": "toponym",
"confidence": {
"state": "pre-added",
"who": ["user:tagtogUsername"],
"prob": 1
}
}
},
"normalizations": {}
},
{
"classId": "e_4",
"part": "s1v1",
"offsets": [{
"start": 132,
"text": "toponymName"
}],
"coordinates": [],
"confidence": {
"state": "pre-added",
"who": ["user:tagtogUsername"],
"prob": 1
},
"fields": {
"f_23": {
"value": "toponym",
"confidence": {
"state": "pre-added",
"who": ["user:tagtogUsername"],
"prob": 1
}
}
},
"normalizations": {}
},
...
],
"relations": []
}