cml-props.txt 671 Bytes
Newer Older
priyank's avatar
priyank committed
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48
#SSF properties: one setting per line, written as a key and its value separated by a tab.

encoding	UTF-8
rootName	SSF
chunkStart	((
chunkEnd	))
#Disabled alternative: split fields on any run of whitespace instead of a single tab.
#fieldSeparatorRegex	\s+
fieldSeparatorRegex	\t
fieldSeparatorPrint	\t
sentenceStart	<Sentence
sentenceEnd	</Sentence

metaDataStart	<header
metaDataEnd	</header

textStart	<text
textEnd	</text

documentStart	<document
documentEnd	</document

storyStart	<body
storyEnd	</body

paragraphStart	<tb
paragraphEnd	</tb

#Document	document
#Attributes: docid, docnumber

#Body	body
#The body element replaces story: storyStart/storyEnd above are set to the <body and </body tags.

#Paragraph	p
#Segment	segment
#Attributes: segmentnumber

#Sentence	sentence
#Attributes: sentencenumber

#Foreign	foreign

wordTagSeparator	_
unknownTag	UNK

bracketFormStart	[[
bracketFormEnd	]]