pandoc-2.1: Conversion between markup formats

CopyrightCopyright (C) 2006-2018 John MacFarlane
LicenseGNU GPL, version 2 or above
MaintainerJohn MacFarlane <jgm@berkeley.edu>
Stabilityalpha
Portabilityportable
Safe HaskellNone
LanguageHaskell98

Text.Pandoc.Shared

Contents

Description

Utility functions and definitions used by the various Pandoc modules.

Synopsis

List processing

splitBy :: (a -> Bool) -> [a] -> [[a]] Source #

Split list by groups of one or more sep.

splitByIndices :: [Int] -> [a] -> [[a]] Source #

splitStringByIndices :: [Int] -> [Char] -> [[Char]] Source #

Split string into chunks divided at specified indices.

substitute :: Eq a => [a] -> [a] -> [a] -> [a] Source #

Replace each occurrence of one sublist in a list with another.

ordNub :: Ord a => [a] -> [a] Source #

Text processing

backslashEscapes Source #

Arguments

:: [Char]

list of special characters to escape

-> [(Char, String)] 

Returns an association list of backslash escapes for the designated characters.

escapeStringUsing :: [(Char, String)] -> String -> String Source #

Escape a string of characters, using an association list of characters and strings.

stripTrailingNewlines :: String -> String Source #

Strip trailing newlines from string.

trim :: String -> String Source #

Remove leading and trailing space (including newlines) from string.

triml :: String -> String Source #

Remove leading space (including newlines) from string.

trimr :: String -> String Source #

Remove trailing space (including newlines) from string.

stripFirstAndLast :: String -> String Source #

Strip leading and trailing characters from string

camelCaseToHyphenated :: String -> String Source #

Change CamelCase word to hyphenated lowercase (e.g., camel-case).

toRomanNumeral :: Int -> String Source #

Convert number < 4000 to uppercase roman numeral.

escapeURI :: String -> String Source #

Escape whitespace and some punctuation characters in URI.

tabFilter Source #

Arguments

:: Int

Tab stop

-> Text

Input

-> Text 

Convert tabs to spaces. Tabs will be preserved if tab stop is set to 0.

crFilter :: Text -> Text Source #

Strip out DOS line endings.

Date/time

normalizeDate :: String -> Maybe String Source #

Parse a date and convert (if possible) to YYYY-MM-DD format. We limit years to the range 1601-9999 (ISO 8601 accepts greater than or equal to 1583, but MS Word only accepts dates starting 1601).

Pandoc block and inline list processing

orderedListMarkers :: (Int, ListNumberStyle, ListNumberDelim) -> [String] Source #

Generate infinite lazy list of markers for an ordered list, depending on list attributes.

extractSpaces :: (Inlines -> Inlines) -> Inlines -> Inlines Source #

Extract the leading and trailing spaces from inside an inline element and place them outside the element. SoftBreaks count as Spaces for these purposes.

removeFormatting :: Walkable Inline a => a -> [Inline] Source #

Extract inlines, removing formatting.

stringify :: Walkable Inline a => a -> String Source #

Convert pandoc structure to a string with formatting removed. Footnotes are skipped (since we don't want their contents in link labels).

capitalize :: Walkable Inline a => a -> a Source #

Bring all regular text in a pandoc structure to uppercase.

This function correctly handles cases where a lowercase character doesn't match to a single uppercase character – e.g. “Straße” would be converted to “STRASSE”, not “STRAßE”.

compactify Source #

Arguments

:: [Blocks]

List of list items (each a list of blocks)

-> [Blocks] 

Change final list item from Para to Plain if the list contains no other Para blocks. Like compactify, but operates on Blocks rather than [Block].

compactifyDL :: [(Inlines, [Blocks])] -> [(Inlines, [Blocks])] Source #

Like compactify, but acts on items of definition lists.

linesToPara :: [[Inline]] -> Block Source #

Convert a list of lines into a paragraph with hard line breaks. This is useful e.g. for rudimentary support of LineBlock elements in writers.

data Element Source #

Data structure for defining hierarchical Pandoc documents

Constructors

Blk Block 
Sec Int [Int] Attr [Inline] [Element] 

Instances

Eq Element Source # 

Methods

(==) :: Element -> Element -> Bool #

(/=) :: Element -> Element -> Bool #

Data Element Source # 

Methods

gfoldl :: (forall d b. Data d => c (d -> b) -> d -> c b) -> (forall g. g -> c g) -> Element -> c Element #

gunfold :: (forall b r. Data b => c (b -> r) -> c r) -> (forall r. r -> c r) -> Constr -> c Element #

toConstr :: Element -> Constr #

dataTypeOf :: Element -> DataType #

dataCast1 :: Typeable (* -> *) t => (forall d. Data d => c (t d)) -> Maybe (c Element) #

dataCast2 :: Typeable (* -> * -> *) t => (forall d e. (Data d, Data e) => c (t d e)) -> Maybe (c Element) #

gmapT :: (forall b. Data b => b -> b) -> Element -> Element #

gmapQl :: (r -> r' -> r) -> r -> (forall d. Data d => d -> r') -> Element -> r #

gmapQr :: (r' -> r -> r) -> r -> (forall d. Data d => d -> r') -> Element -> r #

gmapQ :: (forall d. Data d => d -> u) -> Element -> [u] #

gmapQi :: Int -> (forall d. Data d => d -> u) -> Element -> u #

gmapM :: Monad m => (forall d. Data d => d -> m d) -> Element -> m Element #

gmapMp :: MonadPlus m => (forall d. Data d => d -> m d) -> Element -> m Element #

gmapMo :: MonadPlus m => (forall d. Data d => d -> m d) -> Element -> m Element #

Read Element Source # 
Show Element Source # 
Walkable Block Element Source # 

Methods

walk :: (Block -> Block) -> Element -> Element #

walkM :: (Monad m, Applicative m, Functor m) => (Block -> m Block) -> Element -> m Element #

query :: Monoid c => (Block -> c) -> Element -> c #

Walkable Inline Element Source # 

Methods

walk :: (Inline -> Inline) -> Element -> Element #

walkM :: (Monad m, Applicative m, Functor m) => (Inline -> m Inline) -> Element -> m Element #

query :: Monoid c => (Inline -> c) -> Element -> c #

hierarchicalize :: [Block] -> [Element] Source #

Convert list of Pandoc blocks into (hierarchical) list of Elements

uniqueIdent :: [Inline] -> Set String -> String Source #

Generate a unique identifier from a list of inlines. Second argument is a list of already used identifiers.

inlineListToIdentifier :: [Inline] -> String Source #

Convert Pandoc inline list to plain text identifier. HTML identifiers must start with a letter, and may contain only letters, digits, and the characters _-.

isHeaderBlock :: Block -> Bool Source #

True if block is a Header block.

headerShift :: Int -> Pandoc -> Pandoc Source #

Shift header levels up or down.

stripEmptyParagraphs :: Pandoc -> Pandoc Source #

Remove empty paragraphs.

isTightList :: [[Block]] -> Bool Source #

Detect if a list is tight.

addMetaField :: ToMetaValue a => String -> a -> Meta -> Meta Source #

Set a field of a Meta object. If the field already has a value, convert it into a list with the new value appended to the old value(s).

makeMeta :: [Inline] -> [[Inline]] -> [Inline] -> Meta Source #

Create Meta from old-style title, authors, date. This is provided to ease the transition from the old API.

eastAsianLineBreakFilter :: Pandoc -> Pandoc Source #

Remove soft breaks between East Asian characters.

underlineSpan :: Inlines -> Inlines Source #

Builder for underline. This probably belongs in Builder.hs in pandoc-types. Will be replaced once Underline is an element.

TagSoup HTML handling

renderTags' :: [Tag String] -> String Source #

Render HTML tags.

File handling

inDirectory :: FilePath -> IO a -> IO a Source #

Perform an IO action in a directory, returning to starting directory.

collapseFilePath :: FilePath -> FilePath Source #

Remove intermediate "." and ".." directories from a path.

collapseFilePath "./foo" == "foo"
collapseFilePath "/bar/../baz" == "/baz"
collapseFilePath "/../baz" == "/../baz"
collapseFilePath "parent/foo/baz/../bar" ==  "parent/foo/bar"
collapseFilePath "parent/foo/baz/../../bar" ==  "parent/bar"
collapseFilePath "parent/foo/.." ==  "parent"
collapseFilePath "/parent/foo/../../bar" ==  "/bar"

URI handling

schemes :: Set String Source #

Schemes from http://www.iana.org/assignments/uri-schemes.html plus the unofficial schemes doi, javascript, isbn, pmid.

isURI :: String -> Bool Source #

Check if the string is a valid URL with a IANA or frequently used but unofficial scheme (see schemes).

Error handling

mapLeft :: (a -> b) -> Either a c -> Either b c Source #

for squashing blocks

Safe read

safeRead :: (MonadPlus m, Read a) => String -> m a Source #

Temp directory

withTempDir :: String -> (FilePath -> IO a) -> IO a Source #

Version

pandocVersion :: String Source #

Version number of pandoc library.