-
Notifications
You must be signed in to change notification settings - Fork 3
/
params.json
33 lines (33 loc) · 1.79 KB
/
params.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
{
  "api": "http://xxx.xxx.xxx.xxx:8888/extra/api",
  "taxonomies": [
    {
      "name": "IPTC Media Topics",
      "language": "english",
      "topics_file": "topics/IPTC-Media-Topics-english.txt",
      "rules_file": "rules/IPTC-Media-Topics-english.txt",
      "corpora": [
        {
          "corpus_name": "Reuters",
          "language": "english",
          "schema": {
            "fields": [
              {
                "hasParagraphs": false,
                "hasSentences": true,
                "name": "title",
                "textual": true
              },
              {
                "hasParagraphs": true,
                "hasSentences": true,
                "name": "body",
                "textual": true
              },
              {
                "hasParagraphs": false,
                "hasSentences": false,
                "name": "id",
                "textual": false
              },
              {
                "hasParagraphs": false,
                "hasSentences": false,
                "name": "slugline",
                "textual": false
              },
              {
                "hasParagraphs": false,
                "hasSentences": false,
                "name": "versionCreated",
                "textual": false,
                "date": true
              }
            ],
            "language": "english",
            "name": "Reuters Schema"
          },
          "documents_file": "corpora/reuters-documents.json"
        }
      ]
    },
    {
      "name": "IPTC Media Topics",
      "language": "german",
      "topics_file": "topics/IPTC-Media-Topics-german.txt",
      "rules_file": "rules/IPTC-Media-Topics-german.txt",
      "corpora": [
        {
          "corpus_name": "APA",
          "language": "german",
          "schema": {
            "fields": [
              {
                "hasParagraphs": false,
                "hasSentences": true,
                "name": "title",
                "textual": true
              },
              {
                "hasParagraphs": false,
                "hasSentences": true,
                "name": "subtitle",
                "textual": true
              },
              {
                "hasParagraphs": true,
                "hasSentences": true,
                "name": "body",
                "textual": true
              },
              {
                "hasParagraphs": false,
                "hasSentences": false,
                "name": "id",
                "textual": false
              },
              {
                "hasParagraphs": false,
                "hasSentences": false,
                "name": "slugline",
                "textual": false
              },
              {
                "hasParagraphs": false,
                "hasSentences": false,
                "name": "versionCreated",
                "textual": false,
                "date": true
              }
            ],
            "language": "german",
            "name": "Apa Schema"
          },
          "documents_file": "corpora/apa-documents.json"
        }
      ]
    }
  ]
}