ssf-props.txt.bak 860 Bytes
Newer Older
priyank's avatar
priyank committed
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51
#SSF properties

encoding	UTF-8
rootName	SSF
chunkStart	((
chunkEnd	))
fieldSeparatorRegex	\s+
fieldSeparatorPrint	\t
#sentenceStart	^<sentence|<Sentence|<s>
#sentenceEnd	^<\/sentence|<\/Sentence>|<\/s>
sentenceStart	<Sentence
sentenceEnd	</Sentence

#metaDataStart	^<meta
#metaDataEnd	^</meta
metaDataStart	<Meta
metaDataEnd	</Meta

#textStart	^<Text
#textEnd	^<\/Text>
textStart	<Text
textEnd	</Text

#storyStart	^<document|<Document|<Story
#storyEnd	^<\/document|<\/Document|<\/Story
storyStart	<Story
storyEnd	</Story

#Document	document
#Attributes of Document: docid, docnumber

#Body	body
#Body will replace Story (see storyStart/storyEnd above)

#Paragraph	p
#Segment	segment
#Attributes of Segment: segmentnumber

#Sentence	sentence
#Attributes of Sentence: sentencenumber

#Foreign	foreign

wordTagSeparator	_
unknownTag	UNK

#bracketFormStart	^\s+\[\[
#bracketFormEnd	\]\]\s+$
bracketFormStart	[[
bracketFormEnd	]]