| Safe Haskell | None |
|---|---|
Morphosyntax data layer in Polish.
- type Tag = Text
- data Seg t = Seg {}
- data Word = Word {}
- data Interp t = Interp {}
- data Space
- type Sent t = [Seg t]
- data SentO t = SentO {}
- restore :: Sent t -> Text
- withOrig :: Sent t -> SentO t
- packSegTag :: Tagset -> Seg Tag -> Seg Word Tag
- packSeg :: Ord a => Seg a -> Seg Word a
- packSentTag :: Tagset -> Sent Tag -> Sent Word Tag
- packSentTagO :: Tagset -> SentO Tag -> SentO Word Tag
- packSent :: Ord a => Sent a -> Sent Word a
- embedSent :: Ord a => Sent a -> [a] -> Sent a
Tag
Segment
A segment.
A word.
No space, space or newline. TODO: Perhaps we should use a more informative data type.
Sentence
restore :: Sent t -> Text
Restore the textual representation of a sentence. The function is not very accurate; it could be improved by enriching the representation of a space.
Conversion
packSegTag :: Tagset -> Seg Tag -> Seg Word Tag
Convert a segment to a segment from a core library.
packSentTag :: Tagset -> Sent Tag -> Sent Word Tag
Convert a sentence to a sentence from a core library.
packSentTagO :: Tagset -> SentO Tag -> SentO Word Tag
Convert a sentence to a sentence from a core library.