##
## registry entry for corpus REUTERS
##

# long descriptive name for the corpus
NAME "Reuters Sample Corpus"
# corpus ID (must be lowercase in registry!)
ID   reuters
# path to binary data files
# NOTE(review): /PATH/TO/INDEXED/CORPUS/DIR looks like an unreplaced
# placeholder -- confirm it is substituted with the real location on install
HOME /PATH/TO/INDEXED/CORPUS/DIR/reuters
# optional info file (displayed by "info;" command in CQP)
# NOTE(review): this path points at the parent of the HOME directory, not
# inside the "reuters" data directory -- confirm the info file lives there
INFO /PATH/TO/INDEXED/CORPUS/DIR/.info.md

# corpus properties provide additional information about the corpus:
# NOTE(review): the two lines below look like comments but carry
# key = "value" settings; presumably the corpus tools read them, so do not
# strip or reformat their prefix when tidying comments -- TODO confirm
##:: charset = "latin1"	# character encoding of corpus data
##:: language = "en"	# insert ISO code for language (de, en, fr, ...)
#========================================================================#


##
## p-attributes (token annotations)
##

ATTRIBUTE word


##
## s-attributes (structural markup)
##

STRUCTURE id
STRUCTURE topics_cat
STRUCTURE places
STRUCTURE language
