From 1ac5768b14abd308b9c4755275fb17819903db3d Mon Sep 17 00:00:00 2001
From: Alexander Nozik <altavir@gmail.com>
Date: Sat, 4 Nov 2023 16:57:34 +0300
Subject: [PATCH] Add pandoc wrapper

---
 settings.gradle.kts                           |    3 +-
 snark-pandoc/README.md                        |   66 +
 snark-pandoc/build.gradle.kts                 |   20 +
 .../space/kscience/snark/pandoc/Pandoc.kt     |   69 +
 .../snark/pandoc/PandocCommandBuilder.kt      | 1239 +++++++++++++++++
 .../kscience/snark/pandoc/PandocInstaller.kt  |  264 ++++
 .../kscience/snark/pandoc/ResponseDto.kt      |   34 +
 .../jvmMain/resources/installer.properties    |    8 +
 snark-pandoc/src/jvmTest/kotlin/PandocTest.kt |  111 ++
 snark-pandoc/testing_directory/first_test.md  |   15 +
 snark-pandoc/testing_directory/simple.txt     |    1 +
 11 files changed, 1829 insertions(+), 1 deletion(-)
 create mode 100644 snark-pandoc/README.md
 create mode 100644 snark-pandoc/build.gradle.kts
 create mode 100644 snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/Pandoc.kt
 create mode 100644 snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/PandocCommandBuilder.kt
 create mode 100644 snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/PandocInstaller.kt
 create mode 100644 snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/ResponseDto.kt
 create mode 100644 snark-pandoc/src/jvmMain/resources/installer.properties
 create mode 100644 snark-pandoc/src/jvmTest/kotlin/PandocTest.kt
 create mode 100644 snark-pandoc/testing_directory/first_test.md
 create mode 100644 snark-pandoc/testing_directory/simple.txt

diff --git a/settings.gradle.kts b/settings.gradle.kts
index 87d8990..04380ea 100644
--- a/settings.gradle.kts
+++ b/settings.gradle.kts
@@ -41,5 +41,6 @@ include(
     ":snark-gradle-plugin",
     ":snark-core",
     ":snark-html",
-    ":snark-ktor"
+    ":snark-ktor",
+    ":snark-pandoc"
 )
\ No newline at end of file
diff --git a/snark-pandoc/README.md b/snark-pandoc/README.md
new file mode 100644
index 0000000..210974b
--- /dev/null
+++ b/snark-pandoc/README.md
@@ -0,0 +1,66 @@
+## Examples
+### Simple conversion
+Convert from INPUT_FILE to OUTPUT_FILE:
+```java
+PandocWrapper wrapper = new PandocWrapper();
+wrapper.use(p -> {
+        var command = new PandocCommandBuilder(List.of(INPUT_FILE), OUTPUT_FILE);
+        PandocWrapper.execute(command);
+        });
+```
+Equal to:
+```
+pandoc --output=OUTPUT_FILE INPUT_FILE
+```
+### Convert and set formats
+Convert from INPUT_FILE to OUTPUT_FILE and set INPUT_FORMAT and OUTPUT_FORMAT:
+```java
+PandocWrapper wrapper = new PandocWrapper();
+wrapper.use(p -> {
+        var command = new PandocCommandBuilder(List.of(INPUT_FILE), OUTPUT_FILE);
+        command.formatFrom(INPUT_FORMAT);
+        command.formatTo(OUTPUT_FORMAT);
+        PandocWrapper.execute(command);
+        });
+```
+Equal to:
+```
+pandoc --output=OUTPUT_FILE --from=INPUT_FORMAT --to=OUTPUT_FORMAT INPUT_FILE
+```
+### Converting with options
+Convert INPUT_FILE to a standalone OUTPUT_FILE and set the variable KEY to VALUE:
+```java
+PandocWrapper wrapper = new PandocWrapper();
+wrapper.use(p -> {
+        var command = new PandocCommandBuilder(List.of(INPUT_FILE), OUTPUT_FILE);
+        command.standalone();
+        command.setVariable(KEY, VALUE);
+        PandocWrapper.execute(command);
+        });
+```
+Equal to:
+```
+pandoc --output=OUTPUT_FILE --standalone --variable=KEY:VALUE INPUT_FILE
+```
+
+### Write output from pandoc to file
+Write the list of supported input formats to OUTPUT_FILE:
+```java
+PandocWrapper wrapper = new PandocWrapper();
+wrapper.use(p -> {
+        var command = new PandocCommandBuilder();
+        command.getInputFormats();
+        PandocWrapper.execute(command, OUTPUT_FILE);
+        });
+```
+OUTPUT_FILE will then contain the list of supported input formats, one per line.
+
+### Write errors from pandoc to file
+Write everything from the error stream, plus the exit code, to ERROR_FILE and the regular output to OUTPUT_FILE:
+```java
+PandocWrapper wrapper = new PandocWrapper();
+wrapper.use(p -> {
+        var command = new PandocCommandBuilder(List.of(INPUT_FILE), OUTPUT_FILE);
+        PandocWrapper.execute(command, OUTPUT_FILE, ERROR_FILE);
+        });
+```
\ No newline at end of file
diff --git a/snark-pandoc/build.gradle.kts b/snark-pandoc/build.gradle.kts
new file mode 100644
index 0000000..a3ab2a4
--- /dev/null
+++ b/snark-pandoc/build.gradle.kts
@@ -0,0 +1,20 @@
+plugins {
+    id("space.kscience.gradle.mpp")
+}
+
+// Build script of the snark-pandoc module.
+kscience {
+    useSerialization {
+        json()
+    }
+    jvm()
+    jvmMain {
+        api(spclibs.slf4j)
+        // NOTE(review): commons-exec 1.3 and commons-compress 1.2 look dated — confirm these versions are intended.
+        implementation("org.apache.commons:commons-exec:1.3")
+        implementation("org.apache.commons:commons-compress:1.2")
+    }
+    jvmTest{
+        implementation(spclibs.logback.classic)
+    }
+}
diff --git a/snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/Pandoc.kt b/snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/Pandoc.kt
new file mode 100644
index 0000000..7a0592d
--- /dev/null
+++ b/snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/Pandoc.kt
@@ -0,0 +1,69 @@
+package space.kscience.snark.pandoc
+
+import org.slf4j.Logger
+import org.slf4j.LoggerFactory
+import java.io.BufferedReader
+import java.io.IOException
+import java.io.InputStreamReader
+import java.nio.file.Files
+import java.nio.file.Path
+import java.nio.file.StandardOpenOption
+import java.util.concurrent.TimeUnit
+import kotlin.io.path.Path
+
+public object Pandoc {
+    private val logger: Logger = LoggerFactory.getLogger(Pandoc::class.java)
+
+    /** Resolves the pandoc executable: system `pandoc`, then [pandocExecutablePath], else a fresh install. */
+    private fun getOrInstallPandoc(pandocExecutablePath: Path): String = try {
+        // start() throws IOException when the `pandoc` program cannot be launched.
+        ProcessBuilder("pandoc", "--version").start().waitFor()
+        "pandoc"
+    } catch (ex: IOException) {
+        if (Files.exists(pandocExecutablePath)) {
+            pandocExecutablePath.toAbsolutePath().toString()
+        } else {
+            logger.info("Pandoc not found in the system. Installing it from GitHub")
+            PandocInstaller.installPandoc(pandocExecutablePath).toAbsolutePath().toString()
+        }
+    }
+
+    /**
+     * Runs pandoc with the options configured by [commandBuilder].
+     * @param redirectOutput file receiving pandoc's stdout, or null to leave it unredirected
+     * @param redirectError file receiving pandoc's stderr, or null to leave it unredirected
+     * @param pandocExecutablePath local pandoc binary used (or installed) when system `pandoc` cannot be started
+     * @return true only if pandoc finished within one second with exit code 0
+     */
+    public fun execute(
+        redirectOutput: Path? = null,
+        redirectError: Path? = null,
+        pandocExecutablePath: Path = Path("./pandoc").toAbsolutePath(),
+        commandBuilder: PandocCommandBuilder.() -> Unit,
+    ): Boolean {
+        val path = getOrInstallPandoc(pandocExecutablePath)
+        try {
+            val commandLine = PandocCommandBuilder().apply(commandBuilder).build(path)
+            logger.info("Running pandoc: ${commandLine.joinToString(separator = " ")}")
+            val pandoc = ProcessBuilder(commandLine).apply {
+                redirectOutput?.let { redirectOutput(it.toFile()) }
+                redirectError?.let { redirectError(it.toFile()) }
+            }.start()
+            // exitValue() throws while the process is alive, so honour the waitFor result and reap it.
+            if (!pandoc.waitFor(1, TimeUnit.SECONDS)) {
+                pandoc.destroyForcibly()
+                logger.error("Pandoc did not finish within 1 second and was terminated")
+                return false
+            }
+            val exitCode = pandoc.exitValue()
+            if (exitCode == 0) logger.info("Successfully execute") else logger.error("Pandoc exited with code $exitCode")
+            return exitCode == 0
+        } catch (e: InterruptedException) {
+            Thread.currentThread().interrupt() // keep the interrupt visible to the caller
+            return false
+        } catch (e: Exception) {
+            logger.error("Got problems with executing: " + e.message)
+            return false
+        }
+    }
+}
diff --git a/snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/PandocCommandBuilder.kt b/snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/PandocCommandBuilder.kt
new file mode 100644
index 0000000..b56200b
--- /dev/null
+++ b/snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/PandocCommandBuilder.kt
@@ -0,0 +1,1239 @@
+package space.kscience.snark.pandoc
+
+import java.net.URL
+import java.nio.file.Path
+import java.util.*
+import kotlin.io.path.absolutePathString
+
+public class PandocCommandBuilder(
+    public var options: MutableList<String> = ArrayList(),
+    public var inputFiles: MutableList<Path> = ArrayList(),
+) {
+
+    /**
+     * Assembles the full pandoc command line: executable, then options, then input files.
+     *
+     * The result is a fresh list; [options] and [inputFiles] are left untouched, so calling
+     * this method repeatedly yields the same command instead of accumulating duplicates.
+     *
+     * @param pandocPath name or path of the pandoc executable, used as the first token
+     * @return the command tokens; only executable and options when there are no input files
+     */
+    public fun build(pandocPath: String): List<String> {
+        val inputs = inputFiles.map { it.absolutePathString() }
+        // Concatenation copies, so the builder's own lists are never modified.
+        return listOf(pandocPath) + options + inputs
+    }
+
+    /**
+     * Specify input format
+     */
+    public fun formatFrom(format: String) {
+        val readerOption = "--from=$format"
+        options.add(readerOption)
+    }
+
+    /**
+     * Specify output format
+     */
+    public fun formatTo(format: String) {
+        val writerOption = "--to=$format"
+        options.add(writerOption)
+    }
+
+    public fun addInputFile(file: Path) {
+        inputFiles.run { add(file) } // kept separate from options
+    }
+
+    /**
+     * Set file output. Without it output == stdout
+     */
+    public fun outputFile(outputFile: Path) {
+        options.add("--output=" + outputFile.absolutePathString())
+    }
+
+    /**
+     * Specify the user data directory to search for pandoc data files. If this option is not specified, the default
+     * user data directory will be used. On *nix and macOS systems this will be the pandoc subdirectory of the XDG
+     * data directory (by default, $HOME/.local/share, overridable by setting the XDG_DATA_HOME environment variable).
+     * If that directory does not exist and $HOME/.pandoc exists, it will be used (for backwards compatibility).
+     * On Windows the default user data directory is %APPDATA%\pandoc. You can find the default user data directory on
+     * your system by looking at the output of pandoc --version. Data files placed in this directory
+     * (for example, reference.odt, reference.docx, epub.css, templates) will override pandoc’s normal defaults.
+     */
+    public fun dataDir(dataDir: Path) {
+        val absoluteDir = dataDir.toAbsolutePath()
+        options.add("--data-dir=$absoluteDir")
+    }
+
+    /**
+     * Specify a set of default option settings. file is a YAML file whose fields correspond to command-line option
+     * settings. All options for document conversion, including input and output files, can be set using a defaults file.
+     * The file will be searched for first in the working directory, and then in the defaults subdirectory of the user
+     * data directory (see PandocOptionsBuilder#dataDir). The .yaml extension may be omitted.
+     * Settings from the defaults file may be overridden or extended by subsequent options on the command line.
+     */
+    public fun defaultSettings(file: Path) {
+        val defaultsOption = "--defaults=$file"
+        options.add(defaultsOption)
+    }
+
+    /**
+     * Generate a bash completion script. To enable bash completion with pandoc, add this to your .bashrc:
+     * eval "$(pandoc --bash-completion)"
+     */
+    public fun bashCompletion() {
+        val flag = "--bash-completion"
+        options.add(flag)
+    }
+
+    /**
+     * Give verbose debugging output.
+     */
+    public fun verbose() {
+        // Value-less switch, appended as its own token.
+        options.run { add("--verbose") }
+    }
+
+    /**
+     * Suppress warning messages.
+     */
+    public fun quiet() {
+        val flag = "--quiet"
+        options.add(flag)
+    }
+
+    /**
+     * Exit with error status if there are any warnings.
+     */
+    public fun fallIfWarnings() {
+        // NOTE(review): the method name says "fall", the emitted flag is --fail-if-warnings.
+        options.run { add("--fail-if-warnings") }
+    }
+
+    /**
+     * Write log messages in machine-readable JSON format to file. All messages above DEBUG level will be written,
+     * regardless of verbosity settings (--verbose, --quiet).
+     * @param file
+     */
+    public fun logFile(file: Path) {
+        val logOption = "--log=$file"
+        options.add(logOption)
+    }
+
+    /**
+     * List supported input formats, one per line.
+     */
+
+    public fun getInputFormats() {
+        options.run { add("--list-input-formats") } // only queues the flag, returns nothing
+    }
+
+    public fun getOutputFormats() {
+        options.run { add("--list-output-formats") } // only queues the flag, returns nothing
+    }
+
+    /**
+     * List supported extensions for format, one per line, preceded by a + or - indicating whether it is enabled by
+     * default in format. If FORMAT is not specified, defaults for pandoc’s Markdown are given.
+     * @param format
+     */
+    public fun getExtensions(format: String?) {
+        // A null format selects the argument-less form of the flag.
+        val flag = when (format) {
+            null -> "--list-extensions"
+            else -> "--list-extensions=$format"
+        }
+        options.add(flag)
+    }
+
+    public fun getHighlightLanguages() {
+        options.run { add("--list-highlight-languages") } // only queues the flag, returns nothing
+    }
+
+    public fun getHighlightStyles() {
+        options.run { add("--list-highlight-styles") } // only queues the flag, returns nothing
+    }
+
+    public fun getVersion() {
+        options.run { add("--version") } // only queues the flag, returns nothing
+    }
+
+    /**
+     * Show the usage message.
+     */
+    public fun help() {
+        val flag = "--help"
+        options.add(flag)
+    }
+
+    /**
+     * Shift heading levels by a positive or negative integer. For example, with --shift-heading-level-by=-1, level 2
+     * headings become level 1 headings, and level 3 headings become level 2 headings. Headings cannot have a level less
+     * than 1, so a heading that would be shifted below level 1 becomes a regular paragraph.
+     * Exception: with a shift of -N, a level-N heading at the beginning of the document replaces the metadata title.
+     * --shift-heading-level-by=-1 is a good choice when converting HTML or Markdown documents
+     * that use an initial level-1 heading for the document title and level-2+ headings for sections.
+     * --shift-heading-level-by=1 may be a good choice for converting Markdown documents that use level-1 headings for
+     * sections to HTML, since pandoc uses a level-1 heading to render the document title.
+     */
+    public fun shiftHeadingLevelBy(number: Int) {
+        val shiftOption = "--shift-heading-level-by=$number"
+        options.add(shiftOption)
+    }
+
+    /**
+     * Specify classes to use for indented code blocks–for example, perl,numberLines or haskell.
+     * Multiple classes may be separated by spaces or commas.
+     */
+    public fun indentedCodeClasses(classes: String) {
+        // The class list is forwarded verbatim, separators included.
+        options.run { add("--indented-code-classes=$classes") }
+    }
+
+    /**
+     * Specify a default extension to use when image paths/URLs have no extension. This allows you to use
+     * the same source for formats that require different kinds of images.
+     * Currently, this option only affects the Markdown and LaTeX readers.
+     */
+    public fun defaultImageExtension(extension: String) {
+        val extensionOption = "--default-image-extension=$extension"
+        options.add(extensionOption)
+    }
+
+    /**
+     * Parse each file individually before combining for multifile documents. This will allow footnotes in different
+     * files with the same identifiers to work as expected. If this option is set, footnotes and links will not
+     * work across files. Reading binary files (docx, odt, epub) implies --file-scope.
+     * If two or more files are processed using --file-scope, prefixes based on the filenames will be added to
+     * identifiers in order to disambiguate them, and internal links will be adjusted accordingly. For example,
+     * a header with identifier foo in subdir/file1.txt will have its identifier changed to subdir__file1.txt__foo.
+     * In addition, a Div with an identifier based on the filename will be added around the file’s content,
+     * so that internal links to the filename will point to this Div’s identifier.
+     */
+    public fun fileScope() {
+        val flag = "--file-scope"
+        options.add(flag)
+    }
+
+    /**
+     * Specify an executable to be used as a filter transforming the pandoc AST after the input is parsed and before
+     * the output is written. The executable should read JSON from stdin and write JSON to stdout. The JSON must be
+     * formatted like pandoc’s own JSON input and output. The name of the output format will be passed to the filter
+     * as the first argument. Hence,
+     * pandoc --filter ./caps.py -t latex
+     * is equivalent to
+     * pandoc -t json | ./caps.py latex | pandoc -f json -t latex
+     * The latter form may be useful for debugging filters.
+     * Filters may be written in any language. Text.Pandoc.JSON exports toJSONFilter to facilitate writing filters
+     * in Haskell. Those who would prefer to write filters in python can use the module pandocfilters,
+     * installable from PyPI. There are also pandoc filter libraries in PHP, perl, and JavaScript/node.js.
+     * In order of preference, pandoc will look for filters in
+     * 1. a specified full or relative path (executable or non-executable),
+     * 2. $DATADIR/filters (executable or non-executable) where $DATADIR is the user data directory (see --data-dir, above),
+     * 3. $PATH (executable only).
+     * Filters, Lua-filters, and citeproc processing are applied in the order specified on the command line.
+     */
+    public fun filter(program: Path) {
+        // Sent as one argv token: the short form "-F <path>" would hand pandoc a path with a leading space.
+        options.add("--filter=$program")
+    }
+
+    /**
+     * Transform the document in a similar fashion as JSON filters (see --filter), but use pandoc’s built-in Lua
+     * filtering system. The given Lua script is expected to return a list of Lua filters which will be applied in order.
+     * Each Lua filter must contain element-transforming functions indexed by the name of the AST element on which the
+     * filter function should be applied.
+     * The pandoc Lua module provides helper functions for element creation.
+     * It is always loaded into the script’s Lua environment.
+     * See the Lua filters documentation for further details.
+     * In order of preference, pandoc will look for Lua filters in
+     * 1. a specified full or relative path,
+     * 2. $DATADIR/filters where $DATADIR is the user data directory (see --data-dir, above).
+     * Filters, Lua filters, and citeproc processing are applied in the order specified on the command line.
+     */
+    public fun luaFilter(program: Path) {
+        // Sent as one argv token: the short form "-L <path>" would hand pandoc a path with a leading space.
+        options.add("--lua-filter=$program")
+    }
+
+    /**
+     * Set the metadata field KEY to the value VAL. A value specified on the command line overrides a value specified in
+     * the document using YAML metadata blocks. Values will be parsed as YAML boolean or string values. If no value is
+     * specified, the value will be treated as Boolean true. Like --variable, --metadata causes template variables
+     * to be set. But unlike --variable, --metadata affects the metadata of the underlying document (which is accessible
+     * from filters and may be printed in some output formats) and metadata values will be escaped
+     * when inserted into the template.
+     */
+    public fun metadata(key: String, value: String? = null) {
+        // Emit exactly one option: the bare key when no value is given, KEY:VAL otherwise.
+        if (value == null) {
+            options.add("--metadata=$key")
+        } else {
+            options.add("--metadata=$key:$value")
+        }
+    }
+
+    /**
+     * Read metadata from the supplied YAML (or JSON) file. This option can be used with every input format, but string
+     * scalars in the metadata file will always be parsed as Markdown. (If the input format is Markdown or a Markdown
+     * variant, then the same variant will be used to parse the metadata file; if it is a non-Markdown format, pandoc’s
+     * default Markdown extensions will be used.) This option can be used repeatedly to include multiple metadata files;
+     * values in files specified later on the command line will be preferred over those specified in earlier files.
+     * Metadata values specified inside the document, or by using -M, overwrite values specified with this option.
+     * The file will be searched for first in the working directory, and then in the metadata subdirectory of the user
+     * data directory (see --data-dir).
+     */
+    public fun metadataFile(file: Path) {
+        val metadataOption = "--metadata-file=$file"
+        options.add(metadataOption)
+    }
+
+    /**
+     * Preserve tabs instead of converting them to spaces. (By default, pandoc converts tabs to spaces before parsing
+     * its input.) Note that this will only affect tabs in literal code spans and code blocks.
+     * Tabs in regular text are always treated as spaces.
+     */
+    public fun preserveTabs() {
+        val flag = "--preserve-tabs"
+        options.add(flag)
+    }
+
+    /**
+     * Specify the number of spaces per tab (default is 4).
+     */
+    public fun tabStop(number: Int) {
+        val tabOption = "--tab-stop=$number"
+        options.add(tabOption)
+    }
+
+    /**
+     * Specifies what to do with insertions, deletions, and comments produced by the MS Word “Track Changes” feature.
+     * accept (the default) processes all the insertions and deletions. reject ignores them. Both accept and reject
+     * ignore comments. all includes all insertions, deletions, and comments, wrapped in spans with insertion, deletion,
+     * comment-start, and comment-end classes, respectively. The author and time of change is included. all is useful
+     * for scripting: only accepting changes from a certain reviewer, say, or before a certain date. If a paragraph is
+     * inserted or deleted, track-changes=all produces a span with the class paragraph-insertion/paragraph-deletion
+     * before the affected paragraph break. This option only affects the docx reader.
+     */
+    public fun trackChanges(option: String) {
+        // The mode string is forwarded unchecked.
+        options.run { add("--track-changes=$option") }
+    }
+
+    /**
+     * Extract images and other media contained in or linked from the source document to the path DIR, creating it
+     * if necessary, and adjust the images references in the document so they point to the extracted files. Media are
+     * downloaded, read from the file system, or extracted from a binary container (e.g. docx), as needed.
+     * The original file paths are used if they are relative paths not containing ...
+     * Otherwise, filenames are constructed from the SHA1 hash of the contents.
+     */
+    public fun extractMediaDirectory(dir: Path) {
+        val mediaOption = "--extract-media=$dir"
+        options.add(mediaOption)
+    }
+
+    /**
+     * Specifies a custom abbreviations file, with abbreviations one to a line. If this option is not specified, pandoc
+     * will read the data file abbreviations from the user data directory or fall back on a system default.
+     * To see the system default, use pandoc --print-default-data-file=abbreviations. The only use pandoc makes of this
+     * list is in the Markdown reader. Strings found in this list will be followed by a nonbreaking space, and
+     * the period will not produce sentence-ending space in formats like LaTeX. The strings may not contain spaces.
+     */
+    public fun abbreviationsFile(file: Path) {
+        val abbreviationsOption = "--abbreviations=$file"
+        options.add(abbreviationsOption)
+    }
+
+    /**
+     * Print diagnostic output tracing parser progress to stderr. This option is intended for use by developers
+     * in diagnosing performance issues.
+     */
+    public fun trace() {
+        val flag = "--trace"
+        options.add(flag)
+    }
+
+    /**
+     * Produce output with an appropriate header and footer (e.g. a standalone HTML, LaTeX, TEI, or RTF file,
+     * not a fragment). This option is set automatically for pdf, epub, epub3, fb2, docx, and odt output.
+     * For native output, this option causes metadata to be included; otherwise, metadata is suppressed.
+     */
+    public fun standalone() {
+        val flag = "--standalone"
+        options.add(flag)
+    }
+
+    /**
+     * Use the specified file as a custom template for the generated document. Implies --standalone. See Templates,
+     * below, for a description of template syntax. If no extension is specified, an extension corresponding to
+     * the writer will be added, so that --template=special looks for special.html for HTML output. If the template
+     * is not found, pandoc will search for it in the templates subdirectory of the user data directory (see --data-dir).
+     * If this option is not used, a default template appropriate for the output format will be used
+     * (see -D/--print-default-template).
+     */
+    public fun setTemplate(file: Path) {
+        val templateOption = "--template=$file"
+        options.add(templateOption)
+    }
+
+    public fun setTemplate(url: URL) {
+        // URL overload: the address is interpolated into the same --template option.
+        options.run { add("--template=$url") }
+    }
+
+    /**
+     * Set the template variable KEY to the value VAL when rendering the document in standalone mode.
+     * If no VAL is specified, the key will be given the value true.
+     */
+    public fun setVariable(key: String, variable: String? = null) {
+        // Emit exactly one option: the bare key when no value is given, KEY:VAL otherwise.
+        if (variable == null) {
+            options.add("--variable=$key")
+        } else {
+            options.add("--variable=$key:$variable")
+        }
+    }
+
+    /**
+     * Run pandoc in a sandbox, limiting IO operations in readers and writers to reading the files specified on
+     * the command line. Note that this option does not limit IO operations by filters or in the production of PDF
+     * documents. But it does offer security against, for example, disclosure of files through the use of include
+     * directives. Anyone using pandoc on untrusted user input should use this option.
+     * Note: some readers and writers (e.g., docx) need access to data files. If these are stored on the file system,
+     * then pandoc will not be able to find them when run in --sandbox mode and will raise an error.
+     * For these applications, we recommend using a pandoc binary compiled with the embed_data_files option,
+     * which causes the data files to be baked into the binary instead of being stored on the file system
+     */
+    public fun sandbox() {
+        val flag = "--sandbox"
+        options.add(flag)
+    }
+
+    /**
+     * Print the system default template for an output FORMAT. (See -t for a list of possible FORMATs.) Templates
+     * in the user data directory are ignored. This option may be used with -o/--output to redirect output to a file,
+     * but -o/--output must come before --print-default-template on the command line.
+     * Note that some of the default templates use partials, for example styles.html. To print the partials,
+     * use --print-default-data-file: for example, --print-default-data-file=templates/styles.html.
+     */
+    public fun printDefaultFormat(format: String) {
+        // Despite the method name, the emitted flag is --print-default-template.
+        options.run { add("--print-default-template=$format") }
+    }
+
+    /**
+     * Print a system default data file. Files in the user data directory are ignored. This option may be used with
+     * -o/--output to redirect output to a file, but -o/--output must come before --print-default-data-file
+     * on the command line.
+     */
+    public fun printDefaultDataFile(file: Path) {
+        val dataFileOption = "--print-default-data-file=$file"
+        options.add(dataFileOption)
+    }
+
+    /**
+     * Manually specify line endings: crlf (Windows), lf (macOS/Linux/UNIX), or native (line endings appropriate
+     * to the OS on which pandoc is being run). The default is native.
+     */
+    public fun setLineEndings(option: String) {
+        val eolOption = "--eol=$option"
+        options.add(eolOption)
+    }
+
+    /**
+     * Specify the default dpi (dots per inch) value for conversion from pixels to inch/centimeters and vice versa.
+     * (Technically, the correct term would be ppi: pixels per inch.) The default is 96dpi. When images contain
+     * information about dpi internally, the encoded value is used instead of the default specified by this option.
+     */
+    public fun setDotsPerInch(number: Int) {
+        val dpiOption = "--dpi=$number"
+        options.add(dpiOption)
+    }
+
+    /**
+     * Determine how text is wrapped in the output (the source code, not the rendered version). With auto (the default),
+     * pandoc will attempt to wrap lines to the column width specified by --columns (default 72). With none,
+     * pandoc will not wrap lines at all. With preserve, pandoc will attempt to preserve the wrapping from the source
+     * document (that is, where there are nonsemantic newlines in the source, there will be nonsemantic newlines
+     * in the output as well). In ipynb output, this option affects wrapping of the contents of markdown cells.
+     */
+    public fun wrapStrategy(strategy: String) {
+        // The strategy name is forwarded unchecked.
+        options.run { add("--wrap=$strategy") }
+    }
+
+    /**
+     * Specify length of lines in characters. This affects text wrapping in the generated source code (see --wrap).
+     * It also affects calculation of column widths for plain text tables (see Tables below).
+     */
+    public fun lengthOfLines(number: Int) {
+        val columnsOption = "--columns=$number"
+        options.add(columnsOption)
+    }
+
+    /**
+     * Include an automatically generated table of contents (or, in the case of latex, context, docx, odt, opendocument,
+     * rst, or ms, an instruction to create one) in the output document. This option has no effect unless
+     * -s/--standalone is used, and it has no effect on man, docbook4, docbook5, or jats output.
+     * Note that if you are producing a PDF via ms, the table of contents will appear at the beginning of the document,
+     * before the title. If you would prefer it to be at the end of the document, use the option
+     * --pdf-engine-opt=--no-toc-relocation.
+     */
+    public fun addTable() {
+        // "Table" here means the table of contents.
+        options.run { add("--table-of-contents") }
+    }
+
+    /**
+     * Specify the number of section levels to include in the table of contents. The default is 3
+     * (which means that level-1, 2, and 3 headings will be listed in the contents).
+     */
+    public fun setTableLevels(numb: Int) {
+        val depthOption = "--toc-depth=$numb"
+        options.add(depthOption)
+    }
+
+    /**
+     * Strip out HTML comments in the Markdown or Textile source, rather than passing them on to Markdown, Textile or
+     * HTML output as raw HTML. This does not apply to HTML comments inside raw HTML blocks
+     * when the markdown_in_html_blocks extension is not set.
+     */
+    public fun stripComments() {
+        val flag = "--strip-comments"
+        options.add(flag)
+    }
+
+    /**
+     * Disables syntax highlighting for code blocks and inlines, even when a language attribute is given.
+     */
+    public fun disableHighlight() {
+        val flag = "--no-highlight"
+        options.add(flag)
+    }
+
+    /**
+     * Specifies the coloring style to be used in highlighted source code. Options are pygments (the default),
+     * kate, monochrome, breezeDark, espresso, zenburn, haddock, and tango. For more information on syntax highlighting
+     * in pandoc, see Syntax highlighting, below. See also --list-highlight-styles.
+     * To generate the JSON version of an existing style, use --print-highlight-style.
+     */
+    public fun highlightStyle(style: String) {
+        val styleOption = "--highlight-style=$style"
+        options.add(styleOption)
+    }
+
+    /**
+     * Specifies the coloring style to be used in highlighted source code.
+     * Param is a JSON file with extension .theme. This will be parsed as a
+     * KDE syntax highlighting theme and (if valid) used as the highlighting style.
+     * To generate the JSON version of an existing style, use --print-highlight-style.
+     */
+    public fun highlightStyle(style: Path) {
+        // Path overload: the file path is interpolated into the same --highlight-style option.
+        options.run { add("--highlight-style=$style") }
+    }
+
+    /**
+     * Prints a JSON version of a highlighting style, which can be modified, saved with a .theme extension, and
+     * used with --highlight-style. This option may be used with -o/--output to redirect output to a file,
+     * but -o/--output must come before --print-highlight-style on the command line.
+     */
+    public fun printHighlightStyle(style: String) {
+        val printOption = "--print-highlight-style=$style"
+        options.add(printOption)
+    }
+
+    /**
+     * Prints a JSON version of a highlighting style, which can be modified, saved with a .theme extension, and
+     * used with --highlight-style. This option may be used with -o/--output to redirect output to a file,
+     * but -o/--output must come before --print-highlight-style on the command line.
+     */
+    public fun printHighlightStyle(file: Path) {
+        // Path overload: the file path is interpolated into the same --print-highlight-style option.
+        options.run { add("--print-highlight-style=$file") }
+    }
+
+    /**
+     * Instructs pandoc to load a KDE XML syntax definition file, which will be used for syntax highlighting of
+     * appropriately marked code blocks. This can be used to add support for new languages or to use altered syntax
+     * definitions for existing languages. This option may be repeated to add multiple syntax definitions.
+     */
+    public fun syntaxDefinition(file: Path) {
+        val flag = "--syntax-definition=$file" // each call appends one more occurrence of the flag
+        options.add(flag)
+    }
+
+    /**
+     * Include contents of FILE, verbatim, at the end of the header. This can be used, for example, to include special
+     * CSS or JavaScript in HTML documents. This option can be used repeatedly to include multiple files in the header.
+     * They will be included in the order specified. Implies --standalone.
+     */
+    public fun includeInHeader(file: Path) {
+        val flag = "--include-in-header=$file" // each call appends one more occurrence of the flag
+        options.add(flag)
+    }
+
+    /**
+     * Include contents of FILE, verbatim, at the end of the header. This can be used, for example, to include special
+     * CSS or JavaScript in HTML documents. This option can be used repeatedly to include multiple files in the header.
+     * They will be included in the order specified. Implies --standalone.
+     */
+    public fun includeInHeader(url: URL) {
+        val flag = "--include-in-header=$url" // the URL is rendered through its toString()
+        options.add(flag)
+    }
+
+    /**
+     * Include contents of FILE, verbatim, at the beginning of the document body (e.g. after the `<body>` tag in HTML,
+     * or the `\begin{document}` command in LaTeX). This can be used to include navigation bars or
+     * banners in HTML documents. This option can be used repeatedly to include multiple files. They will be included
+     * in the order specified. Implies --standalone.
+     */
+    public fun includeBeforeBody(file: Path) {
+        val flag = "--include-before-body=$file" // each call appends one more occurrence of the flag
+        options.add(flag)
+    }
+
+    /**
+     * Include contents of FILE, verbatim, at the beginning of the document body (e.g. after the `<body>` tag in HTML,
+     * or the `\begin{document}` command in LaTeX). This can be used to include navigation bars or
+     * banners in HTML documents. This option can be used repeatedly to include multiple files. They will be included
+     * in the order specified. Implies --standalone.
+     */
+    public fun includeBeforeBody(url: URL) {
+        val flag = "--include-before-body=$url" // the URL is rendered through its toString()
+        options.add(flag)
+    }
+
+    /**
+     * Include contents of FILE, verbatim, at the end of the document body (before the `</body>` tag in HTML,
+     * or the \end{document} command in LaTeX). This option can be used repeatedly to include multiple files.
+     * They will be included in the order specified. Implies --standalone.
+     */
+    public fun includeAfterBody(file: Path) {
+        val flag = "--include-after-body=$file" // each call appends one more occurrence of the flag
+        options.add(flag)
+    }
+
+    /**
+     * Include contents of FILE, verbatim, at the end of the document body (before the `</body>` tag in HTML,
+     * or the \end{document} command in LaTeX). This option can be used repeatedly to include multiple files.
+     * They will be included in the order specified. Implies --standalone.
+     */
+    public fun includeAfterBody(url: URL) {
+        val flag = "--include-after-body=$url" // the URL is rendered through its toString()
+        options.add(flag)
+    }
+
+    /**
+     * List of paths to search for images and other resources. The paths should be separated by : on Linux, UNIX,
+     * and macOS systems, and by ; on Windows. If --resource-path is not specified, the default resource path
+     * is the working directory. Note that, if --resource-path is specified, the working directory must be
+     * explicitly listed or it will not be searched. For example: --resource-path=.:test will search the working
+     * directory and the test subdirectory, in that order. This option can be used repeatedly. Search path components
+     * that come later on the command line will be searched before those that come earlier, so --resource-path foo:bar
+     * --resource-path baz:bim is equivalent to --resource-path baz:bim:foo:bar.
+     */
+    public fun resourcePath(path: String) {
+        val flag = "--resource-path=$path" // the separator-joined path list is passed through unchanged
+        options.add(flag)
+    }
+
+    /**
+     * Set the request header NAME to the value VAL when making HTTP requests (for example, when a URL is given
+     * on the command line, or when resources used in a document must be downloaded). If you’re behind a proxy,
+     * you also need to set the environment variable http_proxy to http://....
+     */
+    public fun requestHeader(name: String, `val`: String) {
+        val header = "--request-header=$name:${`val`}" // NAME and VAL are joined with a single colon
+        options.add(header)
+    }
+
+    /**
+     * Disable the certificate verification to allow access to unsecure HTTP resources
+     * (for example when the certificate is no longer valid or self-signed).
+     */
+    public fun noCheckCertificate() {
+        val flag = "--no-check-certificate" // bare switch, no value attached
+        options.add(flag)
+    }
+
+    /**
+     * Produce a standalone HTML file with no external dependencies, using data: URIs to incorporate the contents of
+     * linked scripts, stylesheets, images, and videos. The resulting file should be “self-contained,” in the sense
+     * that it needs no external files and no net access to be displayed properly by a browser. This option works only
+     * with HTML output formats, including html4, html5, html+lhs, html5+lhs, s5, slidy, slideous, dzslides, and
+     * revealjs. Scripts, images, and stylesheets at absolute URLs will be downloaded; those at relative URLs will be
+     * sought relative to the working directory (if the first source file is local) or relative to the base URL
+     * (if the first source file is remote). Elements with the attribute data-external="1" will be left alone;
+     * the documents they link to will not be incorporated in the document. Limitation: resources that are loaded
+     * dynamically through JavaScript cannot be incorporated; as a result, fonts may be missing when --mathjax is used,
+     * and some advanced features (e.g. zoom or speaker notes) may not work in an offline “self-contained” reveal.js
+     * slide show.
+     */
+    public fun embedResources() {
+        val flag = "--embed-resources" // bare switch, no value attached
+        options.add(flag)
+    }
+
+    /**
+     * Use `<q>` tags for quotes in HTML.
+     * (This option only has an effect if the smart extension is enabled for the input format used.)
+     */
+    public fun htmlQTags() {
+        val flag = "--html-q-tags" // bare switch, no value attached
+        options.add(flag)
+    }
+
+    /**
+     * Use only ASCII characters in output. Currently supported for XML and HTML formats (which use entities instead of
+     * UTF-8 when this option is selected), CommonMark, gfm, and Markdown (which use entities), roff man and ms
+     * (which use hexadecimal escapes), and to a limited degree LaTeX
+     * (which uses standard commands for accented characters when possible).
+     */
+    public fun useAscii() {
+        val flag = "--ascii" // bare switch, no value attached
+        options.add(flag)
+    }
+
+    /**
+     * Use reference-style links, rather than inline links, in writing Markdown or reStructuredText.
+     * By default, inline links are used. The placement of link references is affected by the --reference-location option.
+     */
+    public fun referenceLinks() {
+        val flag = "--reference-links" // bare switch, no value attached
+        options.add(flag)
+    }
+
+    /**
+     * Specify whether footnotes (and references, if reference-links is set) are placed at the end of the current
+     * (top-level) block, the current section, or the document. The default is document. Currently, this option only
+     * affects the markdown, muse, html, epub, slidy, s5, slideous, dzslides, and revealjs writers. In slide formats,
+     * specifying --reference-location=section will cause notes to be rendered at the bottom of a slide.
+     * @param option : block|section|document
+     */
+    public fun referenceLocation(option: String) {
+        val flag = "--reference-location=$option" // the value is forwarded as given, without validation
+        options.add(flag)
+    }
+
+    /**
+     * Specify whether to use ATX-style (#-prefixed) or Setext-style (underlined) headings for level 1 and 2 headings
+     * in Markdown output. (The default is atx.) ATX-style headings are always used for levels 3+. This option also
+     * affects Markdown cells in ipynb output.
+     * @param option : setext|atx
+     */
+    public fun markdownHeadings(option: String) {
+        val flag = "--markdown-headings=$option" // the value is forwarded as given, without validation
+        options.add(flag)
+    }
+
+    /**
+     * Render tables as list tables in RST output.
+     */
+    public fun listTables() {
+        val flag = "--list-tables" // bare switch, no value attached
+        options.add(flag)
+    }
+
+    /**
+     * Treat top-level headings as the given division type in LaTeX, ConTeXt, DocBook, and TEI output. The hierarchy
+     * order is part, chapter, then section; all headings are shifted such that the top-level heading becomes
+     * the specified type. The default behavior is to determine the best division type via heuristics: unless other
+     * conditions apply, section is chosen. When the documentclass variable is set to report, book, or memoir
+     * (unless the article option is specified), chapter is implied as the setting for this option. If beamer is
+     * the output format, specifying either chapter or part will cause top-level headings to become \part{..},
+     * while second-level headings remain as their default type.
+     * @param option : default|section|chapter|part
+     */
+    public fun topLevelDivision(option: String) {
+        val flag = "--top-level-division=$option" // the value is forwarded as given, without validation
+        options.add(flag)
+    }
+
+    /**
+     * Number section headings in LaTeX, ConTeXt, HTML, Docx, ms, or EPUB output. By default, sections are not numbered.
+     * Sections with class unnumbered will never be numbered, even if --number-sections is specified.
+     */
+    public fun numberSections() {
+        val flag = "--number-sections" // bare switch, no value attached
+        options.add(flag)
+    }
+
+    /**
+     * Offset for section headings in HTML output (ignored in other output formats). The first number is added to the
+     * section number for top-level headings, the second for second-level headings, and so on. So, for example,
+     * if you want the first top-level heading in your document to be numbered “6”, specify --number-offset=5.
+     * If your document starts with a level-2 heading which you want to be numbered “1.5”, specify --number-offset=1,4.
+     * Offsets are 0 by default. Implies --number-sections.
+     *
+     * @param numbs offsets ordered from the top heading level downwards, e.g. `listOf(1, 4)` yields
+     * `--number-offset=1,4`; an empty list adds no option.
+     */
+    public fun numberOffset(numbs: List<Int>) {
+        // An empty list carries no offsets, so no option is emitted. Returning early also
+        // avoids indexing into the empty list, which would throw IndexOutOfBoundsException.
+        if (numbs.isEmpty()) {
+            return
+        }
+
+        // The offsets are passed as one comma-separated value,
+        // e.g. listOf(1, 4) -> "--number-offset=1,4".
+        val offsets = numbs.joinToString(separator = ",")
+        options.add("--number-offset=$offsets")
+    }
+
+    /**
+     * Use the listings package for LaTeX code blocks. The package does not support multibyte encoding for source code.
+     * To handle UTF-8 you would need to use a custom template.
+     *
+     * This issue is fully documented in
+     * [Encoding issue with the listings package](https://en.wikibooks.org/wiki/LaTeX/Source_Code_Listings#Encoding_issue).
+     */
+    public fun listings() {
+        val flag = "--listings" // bare switch, no value attached
+        options.add(flag)
+    }
+
+    /**
+     * Make list items in slide shows display incrementally (one by one).
+     * The default is for lists to be displayed all at once.
+     */
+    public fun incremental() {
+        val flag = "--incremental" // bare switch, no value attached
+        options.add(flag)
+    }
+
+    /**
+     * Specifies that headings with the specified level create slides (for beamer, s5, slidy, slideous, dzslides).
+     * Headings above this level in the hierarchy are used to divide the slide show into sections; headings below this
+     * level create subheads within a slide. Valid values are 0-6. If a slide level of 0 is specified,
+     * slides will not be split automatically on headings, and horizontal rules must be used to indicate
+     * slide boundaries. If a slide level is not specified explicitly, the slide level will be set automatically
+     * based on the contents of the document.
+     * See [Structuring the slide show.](https://pandoc.org/MANUAL.html#structuring-the-slide-show)
+     */
+    public fun slideLevel(number: Int) {
+        val flag = "--slide-level=$number" // the level is forwarded as given; no range check is done here
+        options.add(flag)
+    }
+
+    /**
+     * Wrap sections in <section> tags (or <div> tags for html4), and attach identifiers to the enclosing <section>
+     * (or <div>) rather than the heading itself.
+     * See [Heading identifiers](https://pandoc.org/MANUAL.html#heading-identifiers)
+     */
+    public fun sectionDivs() {
+        val flag = "--section-divs" // bare switch, no value attached
+        options.add(flag)
+    }
+
+    /**
+     * Specify a method for obfuscating mailto: links in HTML documents. none leaves mailto: links as they are.
+     * javascript obfuscates them using JavaScript. references obfuscates them by printing their letters as decimal or
+     * hexadecimal character references. The default is none.
+     * @param option : none|javascript|references
+     */
+    public fun emailObfuscation(option: String) {
+        val flag = "--email-obfuscation=$option" // the value is forwarded as given, without validation
+        options.add(flag)
+    }
+
+    /**
+     * Specify a prefix to be added to all identifiers and internal links in HTML and DocBook output, and to footnote
+     * numbers in Markdown and Haddock output. This is useful for preventing duplicate identifiers when generating
+     * fragments to be included in other pages.
+     */
+    public fun idPrefix(option: String) {
+        val flag = "--id-prefix=$option" // the prefix is attached to the flag with `=`
+        options.add(flag)
+    }
+
+    /**
+     * Specify STRING as a prefix at the beginning of the title that appears in the HTML header (but not in the title
+     * as it appears at the beginning of the HTML body). Implies --standalone.
+     */
+    public fun titlePrefix(option: String) {
+        val flag = "--title-prefix=$option" // the prefix is attached to the flag with `=`
+        options.add(flag)
+    }
+
+    /**
+     * Link to a CSS style sheet. This option can be used repeatedly to include multiple files. They will be included in
+     * the order specified. This option only affects HTML (including HTML slide shows) and EPUB output. It should be
+     * used together with -s/--standalone, because the link to the stylesheet goes in the document header.
+     * A stylesheet is required for generating EPUB. If none is provided using this option (or the css or stylesheet
+     * metadata fields), pandoc will look for a file epub.css in the user data directory (see --data-dir).
+     * If it is not found there, sensible defaults will be used.
+     */
+    public fun linkToCss(url: URL) {
+        val flag = "--css=$url" // the URL is rendered through its toString()
+        options.add(flag)
+    }
+
+    /**
+     * Use the specified file as a style reference in producing a docx or ODT file.
+     * See [ Options affecting specific writers](https://pandoc.org/MANUAL.html#options-affecting-specific-writers)
+     */
+    public fun referenceDoc(file: Path) {
+        val flag = "--reference-doc=$file" // the path is rendered through its toString()
+        options.add(flag)
+    }
+
+    /**
+     * Use the specified file as a style reference in producing a docx or ODT file.
+     * The reference document is given as a URL.
+     *
+     * See [Options affecting specific writers](https://pandoc.org/MANUAL.html#options-affecting-specific-writers)
+     */
+    public fun referenceDoc(url: URL) {
+        val flag = "--reference-doc=$url" // the URL is rendered through its toString()
+        options.add(flag)
+    }
+
+    /**
+     * Specify the heading level at which to split an EPUB or chunked HTML document into separate files. The default is
+     * to split into chapters at level-1 headings. In the case of EPUB, this option only affects the internal
+     * composition of the EPUB, not the way chapters and sections are displayed to users. Some readers may be slow
+     * if the chapter files are too large, so for large documents with few level-1 headings, one might want to use
+     * a chapter level of 2 or 3. For chunked HTML, this option determines how much content goes in each “chunk.”
+     */
+    public fun splitLevel(number: Int) {
+        val flag = "--split-level=$number" // the level is forwarded as given; no range check is done here
+        options.add(flag)
+    }
+
+    /**
+     * Specify a template for the filenames in a chunkedhtml document. In the template, %n will be replaced by the chunk
+     * number (padded with leading 0s to 3 digits), %s with the section number of the chunk, %h with the heading text
+     * (with formatting removed), %i with the section identifier. For example, %section-%s-%i.html might be resolved to
+     * section-1.1-introduction.html. The characters / and \ are not allowed in chunk templates and will be ignored.
+     * The default is %s-%i.html.
+     * @param pathTemplate : by default is %s-%i.html
+     */
+    public fun chunkTemplate(pathTemplate: String) {
+        val flag = "--chunk-template=$pathTemplate" // the template is passed through unchanged
+        options.add(flag)
+    }
+
+    /**
+     * Use the specified image as the EPUB cover. It is recommended that the image be less than 1000px in width and
+     * height. Note that in a Markdown source document you can also specify cover-image in a YAML metadata block
+     * (see EPUB Metadata, below).
+     */
+    public fun epubCoverImage(file: Path) {
+        val flag = "--epub-cover-image=$file" // the path is rendered through its toString()
+        options.add(flag)
+    }
+
+    /**
+     * Determines whether a title page is included in the EPUB (default is true).
+     */
+    public fun epubTitlePage(addTitle: Boolean) {
+        val flag = "--epub-title-page=$addTitle" // the Boolean renders as the literal `true` or `false`
+        options.add(flag)
+    }
+
+    /**
+     * Look in the specified XML file for metadata for the EPUB. The file should contain a series of Dublin Core elements
+     * For example:
+     * <dc:rights>Creative Commons</dc:rights>
+     * <dc:language>es-AR</dc:language>
+     * By default, pandoc will include the following metadata elements:
+     * <dc:title> (from the document title),
+     * <dc:creator> (from the document authors),
+     * <dc:date> (from the document date, which should be in ISO 8601 format),
+     * <dc:language> (from the lang variable, or, if is not set, the locale),
+     * and <dc:identifier id="BookId"> (a randomly generated UUID).
+     * Any of these may be overridden by elements in the metadata file.
+     * Note: if the source document is Markdown, a YAML metadata block in the document can be used instead.
+     * See [EPUB Metadata](https://pandoc.org/MANUAL.html#epub-metadata).
+     */
+    public fun epubMetadata(file: Path) {
+        val flag = "--epub-metadata=$file" // the path is rendered through its toString()
+        options.add(flag)
+    }
+
+    /**
+     * Embed the specified font in the EPUB. This option can be repeated to embed multiple fonts. Wildcards can also be
+     * used: for example, DejaVuSans-*.ttf. However, if you use wildcards on the command line, be sure to escape them
+     * or put the whole filename in single quotes, to prevent them from being interpreted by the shell.
+     * To use the embedded fonts, you will need to add declarations like the following to your CSS (see [linkToCss]):
+     * ```
+     * @font-face {
+     * font-family: DejaVuSans;
+     * font-style: normal;
+     * font-weight: normal;
+     * src:url("../fonts/DejaVuSans-Regular.ttf");
+     * }
+     * @font-face {
+     * font-family: DejaVuSans;
+     * font-style: normal;
+     * font-weight: bold;
+     * src:url("../fonts/DejaVuSans-Bold.ttf");
+     * }
+     * @font-face {
+     * font-family: DejaVuSans;
+     * font-style: italic;
+     * font-weight: normal;
+     * src:url("../fonts/DejaVuSans-Oblique.ttf");
+     * }
+     * @font-face {
+     * font-family: DejaVuSans;
+     * font-style: italic;
+     * font-weight: bold;
+     * src:url("../fonts/DejaVuSans-BoldOblique.ttf");
+     * }
+     * body { font-family: "DejaVuSans"; }
+     * ```
+     */
+    public fun epubEmbedFont(file: String) {
+        val flag = "--epub-embed-font=$file" // the string is passed through unchanged, wildcards included
+        options.add(flag)
+    }
+
+    /**
+     * Specify the subdirectory in the OCF container that is to hold the EPUB-specific contents. The default is EPUB.
+     * To put the EPUB contents in the top level, use an empty string.
+     */
+    public fun epubSubdirectory(dir: String) {
+        val flag = "--epub-subdirectory=$dir" // an empty dir yields the flag with an empty value
+        options.add(flag)
+    }
+
+    /**
+     * Determines how ipynb output cells are treated.
+     * all means that all the data formats included in the original are preserved.
+     * none means that the contents of data cells are omitted.
+     * best causes pandoc to try to pick the richest data block in each output cell that is compatible
+     * with the output format.
+     * The default is best.
+     * @param option : all|none|best
+     */
+    public fun ipynbOutput(option: String) {
+        val flag = "--ipynb-output=$option" // the value is forwarded as given, without validation
+        options.add(flag)
+    }
+
+    /**
+     * Use the specified engine when producing PDF output. Valid values are pdflatex, lualatex, xelatex, latexmk,
+     * tectonic, wkhtmltopdf, weasyprint, pagedjs-cli, prince, context, pdfroff, and typst.
+     * If the engine is not in your PATH, the full path of the engine may be specified here.
+     * If this option is not specified, pandoc uses the following defaults depending on the output format
+     * specified using [.formatTo]:
+     * latex or none: pdflatex (other options: xelatex, lualatex, tectonic, latexmk)
+     * context: context
+     * html: wkhtmltopdf (other options: prince, weasyprint, pagedjs-cli; see print-css.rocks for a good introduction
+     * to PDF generation from HTML/CSS)
+     * ms: pdfroff
+     * typst: typst
+     * @param program : pdflatex, lualatex, xelatex, latexmk, tectonic, wkhtmltopdf, weasyprint, pagedjs-cli, prince,
+     * context, pdfroff, and typst
+     */
+    public fun pdfEngine(program: String) {
+        val flag = "--pdf-engine=$program" // engine name or full path, forwarded as given
+        options.add(flag)
+    }
+
+    /**
+     * Use the given string as a command-line argument to the pdf-engine (see [pdfEngine]).
+     * For example, to use a persistent directory foo for latexmk’s auxiliary files, use --pdf-engine-opt=-outdir=foo.
+     * Note that no check for duplicate options is done
+     */
+    public fun pdfEngineOption(option: String) {
+        val flag = "--pdf-engine-opt=$option" // appended on every call; duplicates are not filtered
+        options.add(flag)
+    }
+
+    /**
+     * Process the citations in the file, replacing them with rendered citations and adding a bibliography. Citation
+     * processing will not take place unless bibliographic data is supplied, either through an external file specified
+     * using the [.bibliography] or the bibliography field in metadata, or via a references section in
+     * metadata containing a list of citations in CSL YAML format with Markdown formatting. The style is controlled by
+     * a CSL stylesheet specified using the [.csl] option or the csl field in metadata.
+     * (If no stylesheet is specified, the chicago-author-date style will be used by default.)
+     * The citation processing transformation may be applied before or after filters or Lua filters
+     * (see [.filter], [.luaFilter]):
+     * these transformations are applied in the order they appear on the command line.
+     * For more information, see [Citations](https://pandoc.org/MANUAL.html#citations)
+     */
+    public fun citationProcessing() {
+        val flag = "--citeproc" // bare switch, no value attached
+        options.add(flag)
+    }
+
+    /**
+     * Set the bibliography field in the document’s metadata to FILE, overriding any value set in the metadata.
+     * If you supply this argument multiple times, each FILE will be added to bibliography.
+     * If FILE is not found relative to the working directory,
+     * it will be sought in the resource path (see [resourcePath]).
+     */
+    public fun bibliography(file: Path) {
+        val flag = "--bibliography=$file" // each call appends one more occurrence of the flag
+        options.add(flag)
+    }
+
+    /**
+     * Set the bibliography field in the document’s metadata to URL, overriding any value set in the metadata.
+     * If you supply this argument multiple times, each URL will be added to bibliography.
+     * File will be fetched via HTTP.
+     * it will be sought in the resource path (see [.resourcePath]).
+     */
+    public fun bibliography(url: URL) {
+        val flag = "--bibliography=$url" // the URL is rendered through its toString()
+        options.add(flag)
+    }
+
+    /**
+     * Set the csl field in the document’s metadata to FILE, overriding any value set in the metadata.
+     * (This is equivalent to #metadata(csl, file))
+     * If FILE is not found relative to the working directory, it will be sought in the resource path
+     * (see [.resourcePath]) and finally in the csl subdirectory of the pandoc user data directory.
+     */
+    public fun csl(file: Path) {
+        val flag = "--csl=$file" // the path is rendered through its toString()
+        options.add(flag)
+    }
+
+    /**
+     * Set the csl field in the document’s metadata to URL, overriding any value set in the metadata.
+     * (This is equivalent to #metadata(csl, url)). File will be fetched via HTTP
+     * It will be sought in the resource path (see [.resourcePath])
+     * and finally in the csl subdirectory of the pandoc user data directory.
+     */
+    public fun csl(url: URL) {
+        val flag = "--csl=$url" // the URL is rendered through its toString()
+        options.add(flag)
+    }
+
+    /**
+     * Set the citation-abbreviations field in the document’s metadata to FILE, overriding any value set in the metadata
+     * (This is equivalent to #metadata(citation-abbreviations, url))
+     * If FILE is not found relative to the working directory, it will be sought in the resource path
+     * (see [.resourcePath]) and finally in the csl subdirectory of the pandoc user data directory.
+     */
+    public fun citationAbbreviation(file: Path) {
+        val flag = "--citation-abbreviations=$file" // the path is rendered through its toString()
+        options.add(flag)
+    }
+
+    /**
+     * Set the citation-abbreviations field in the document’s metadata to FILE, overriding any value set in the metadata
+     * (This is equivalent to #metadata(citation-abbreviations, url)) File will be fetched via HTTP
+     * File will be sought in the resource path (see [.resourcePath])
+     * and finally in the csl subdirectory of the pandoc user data directory.
+     */
+    public fun citationAbbreviation(url: URL) {
+        val flag = "--citation-abbreviations=$url" // the URL is rendered through its toString()
+        options.add(flag)
+    }
+
+    /**
+     * Use natbib for citations in LaTeX output. This option is not for use with the [citationProcessing] option
+     * or with PDF output. It is intended for use in producing a LaTeX file that can be processed with bibtex.
+     */
+    public fun natlib() {
+        // pandoc spells this switch `--natbib`; the method keeps its existing name so callers still compile.
+        options.add("--natbib")
+    }
+
+    /**
+     * Use biblatex for citations in LaTeX output. This option is not for use with the [citationProcessing] option
+     * or with PDF output. It is intended for use in producing a LaTeX file that can be processed with bibtex or biber.
+     */
+    public fun biblatex() {
+        val flag = "--biblatex" // bare switch, no value attached
+        options.add(flag)
+    }
+
+    /**
+     * Use MathJax to display embedded TeX math in HTML output. TeX math will be put between `\(...\)` (for inline math)
+     * or `\[...\]` (for display math) and wrapped in `<span>` tags with class math. Then the MathJax JavaScript will
+     * render it. The URL should point to the MathJax.js load script. If a URL is not provided,
+     * a link to the Cloudflare CDN will be inserted.
+     */
+    public fun mathJax(url: Optional<URL>) {
+        // An absent URL yields the bare switch; a present one is attached with `=`.
+        val flag = when {
+            url.isEmpty -> "--mathjax"
+            else -> "--mathjax=" + url.get()
+        }
+        options.add(flag)
+    }
+
+    /**
+     * Convert TeX math to MathML (in epub3, docbook4, docbook5, jats, html4 and html5). This is the default
+     * in odt output. MathML is supported natively by the main web browsers and select e-book readers.
+     */
+    public fun mathML() {
+        val flag = "--mathml" // bare switch, no value attached
+        options.add(flag)
+    }
+
+    /**
+     * Convert TeX formulas to `<img>` tags that link to an external script that converts formulas to images. The formula
+     * will be URL-encoded and concatenated with the URL provided. For SVG images you can for example use
+     * --webtex https://latex.codecogs.com/svg.latex?. If no URL is specified, the CodeCogs URL generating PNGs will be
+     * used (https://latex.codecogs.com/png.latex?). Note: the --webtex option will affect Markdown output as well as
+     * HTML, which is useful if you’re targeting a version of Markdown without native math support.
+     */
+    public fun webTex(url: Optional<URL>) {
+        // pandoc declares `--webtex[=URL]`: an optional value must be joined with `=`, not a space.
+        val flag = when {
+            url.isEmpty -> "--webtex"
+            else -> "--webtex=${url.get()}"
+        }
+        options.add(flag)
+    }
+
+    /**
+     * Use KaTeX to display embedded TeX math in HTML output. The URL is the base URL for the KaTeX library.
+     * That directory should contain a katex.min.js and a katex.min.css file.
+     * If a URL is not provided, a link to the KaTeX CDN will be inserted.
+     */
+    public fun kaTex(url: Optional<URL>) {
+        // pandoc declares `--katex[=URL]`: an optional value must be joined with `=`, not a space.
+        val flag = when {
+            url.isEmpty -> "--katex"
+            else -> "--katex=${url.get()}"
+        }
+        options.add(flag)
+    }
+
+    /**
+     * Enclose TeX math in <eq> tags in HTML output. The resulting HTML can then be processed by GladTeX to produce
+     * SVG images of the typeset formulas and an HTML file with these images embedded.
+     * pandoc -s --gladtex input.md -o myfile.htex
+     * gladtex -d image_dir myfile.htex
+     * # produces myfile.html and images in image_dir
+     */
+    public fun gladtex() {
+        val flag = "--gladtex" // bare switch, no value attached
+        options.add(flag)
+    }
+
+    /**
+     * Print information about command-line arguments to stdout, then exit. This option is intended primarily for use
+     * in wrapper scripts. The first line of output contains the name of the output file specified with the -o option,
+     * or - (for stdout) if no output file was specified. The remaining lines contain the command-line arguments,
+     * one per line, in the order they appear. These do not include regular pandoc options and their arguments,
+     * but do include any options appearing after a -- separator at the end of the line.
+     */
+    public fun dumpArgs() {
+        val flag = "--dump-args" // bare switch, no value attached
+        options.add(flag)
+    }
+
+    /**
+     * Ignore command-line arguments (for use in wrapper scripts). Regular pandoc options are not ignored. For example,
+     * pandoc --ignore-args -o foo.html -s foo.txt -- -e latin1
+     * is equivalent to
+     * pandoc -o foo.html -s
+     */
+    public fun ignoreArgs() {
+        val flag = "--ignore-args" // bare switch, no value attached
+        options.add(flag)
+    }
+}
+
diff --git a/snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/PandocInstaller.kt b/snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/PandocInstaller.kt
new file mode 100644
index 0000000..bbdb728
--- /dev/null
+++ b/snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/PandocInstaller.kt
@@ -0,0 +1,264 @@
+package space.kscience.snark.pandoc
+
+import kotlinx.serialization.json.Json
+import org.apache.commons.compress.archivers.ArchiveEntry
+import org.apache.commons.compress.archivers.tar.TarArchiveInputStream
+import org.apache.commons.compress.compressors.gzip.GzipCompressorInputStream
+import org.apache.commons.exec.OS
+import org.slf4j.Logger
+import org.slf4j.LoggerFactory
+import java.io.BufferedInputStream
+import java.io.FileNotFoundException
+import java.io.IOException
+import java.net.*
+import java.net.http.HttpClient
+import java.net.http.HttpRequest
+import java.net.http.HttpResponse
+import java.nio.file.Files
+import java.nio.file.Path
+import java.nio.file.attribute.PosixFilePermission
+import java.time.Duration
+import java.util.*
+import java.util.zip.ZipInputStream
+import kotlin.io.path.Path
+import kotlin.io.path.inputStream
+
+/**
+ * Downloads the latest pandoc release from GitHub and unpacks it into a local directory.
+ *
+ * The GitHub API endpoint and the location of the executable inside the unpacked archive are read from the
+ * `/installer.properties` classpath resource.
+ */
+internal object PandocInstaller {
+
+    private val log: Logger = LoggerFactory.getLogger(PandocInstaller::class.java)
+
+    /** Connect and read timeout, in seconds, of a single download attempt. */
+    private const val TIMEOUT_SECONDS = 2
+
+    /** Maximum number of download attempts before the installation is abandoned. */
+    private const val ATTEMPTS = 3
+
+    /** Placeholder used when the HTTP status of a failed download cannot be determined. */
+    private const val UNKNOWN_HTTP_CODE = 999
+
+    /**
+     * Platforms for which a pandoc binary archive is looked up.
+     *
+     * @property assetSuffix substring of the release asset name that identifies the archive for the platform
+     * @property propertySuffix suffix of the `path.to.pandoc.*` key in `installer.properties`
+     */
+    private enum class OSType(public val assetSuffix: String, public val propertySuffix: String) {
+        WINDOWS("windows-x86_64.zip", "windows"),
+        MAC_OS_AMD("x86_64-macOS.zip", "mac.os.amd"),
+        MAC_OS_ARM("arm64-macOS.zip", "mac.os.arm"),
+        LINUX_ARM("linux-arm64", "linux.arm"),
+        LINUX_AMD("linux-amd64", "linux.amd")
+    }
+
+    private val properties = Properties().apply {
+        val resource = checkNotNull(PandocInstaller::class.java.getResourceAsStream("/installer.properties")) {
+            "Resource /installer.properties is missing from the classpath"
+        }
+        // Close the resource stream as soon as the properties are loaded.
+        resource.use { load(it) }
+    }
+
+    /**
+     * Install last released pandoc from github
+     *
+     * @param targetPath directory the release archive is unpacked into
+     * @return path to executable pandoc
+     * @throws IOException in case incorrect github url or path of installation directory
+     * @throws IllegalStateException if the current OS is not supported or the archive could not be downloaded
+     * or unpacked
+     */
+    public fun installPandoc(targetPath: Path): Path {
+        log.info("Start install")
+        val os = when {
+            // Mac must be tested before the generic unix family.
+            OS.isFamilyMac() -> if (OS.isArch("aarch64")) OSType.MAC_OS_ARM else OSType.MAC_OS_AMD
+            OS.isFamilyUnix() -> if (OS.isArch("aarch64")) OSType.LINUX_ARM else OSType.LINUX_AMD
+            OS.isFamilyWindows() -> OSType.WINDOWS
+            else -> error("Got unexpected os, could not install pandoc")
+        }
+        return installPandoc(os, targetPath)
+    }
+
+    /**
+     * Downloads the release archive for [os], unpacks it into [targetPath] and makes the pandoc binary executable.
+     *
+     * @return path to the pandoc executable inside [targetPath]
+     */
+    private fun installPandoc(os: OSType, targetPath: Path): Path {
+        val githubResponse = getGithubUrls()
+        val asset = githubResponse.getAssetByOsSuffix(os.assetSuffix)
+        val pandocUrl: URL = URI.create(asset.browserDownloadUrl).toURL()
+
+        log.info("Start installing pandoc os: {}, url: {}, target directory: {}", os, pandocUrl, targetPath)
+
+        val archivePath = downloadWithRetry(pandocUrl) ?: error("Could not save file from github")
+        val installPath = try {
+            unPack(archivePath, targetPath, os) ?: error("Could not unzip file")
+        } finally {
+            // The downloaded archive is a temporary file and is useless after unpacking.
+            Files.deleteIfExists(archivePath)
+        }
+
+        val propertyKey = "path.to.pandoc." + os.propertySuffix
+        val executableTemplate = checkNotNull(properties.getProperty(propertyKey)) {
+            "Property $propertyKey is not defined in installer.properties"
+        }
+        // The configured paths start with '/'. Resolving a rooted path would discard installPath entirely,
+        // so the leading separators are removed to keep the path relative to the installation directory.
+        val relativeExecutable = executableTemplate
+            .replace("{version}", githubResponse.tagName)
+            .trimStart('/')
+        val pandocExecutablePath = installPath.resolve(relativeExecutable)
+
+        if (!Files.isRegularFile(pandocExecutablePath)) {
+            throw FileNotFoundException("Pandoc executable not found at $pandocExecutablePath after unpacking")
+        }
+        makeExecutable(pandocExecutablePath)
+
+        return pandocExecutablePath
+    }
+
+    /**
+     * Adds the execute bits to [file] while keeping its existing permissions.
+     * Does nothing on file systems without POSIX permissions (for example on Windows).
+     */
+    private fun makeExecutable(file: Path) {
+        if (!file.fileSystem.supportedFileAttributeViews().contains("posix")) return
+        val executeBits = setOf(
+            PosixFilePermission.OWNER_EXECUTE,
+            PosixFilePermission.GROUP_EXECUTE,
+            PosixFilePermission.OTHERS_EXECUTE
+        )
+        Files.setPosixFilePermissions(file, Files.getPosixFilePermissions(file) + executeBits)
+    }
+
+    /**
+     * Downloads from a (http/https) URL and saves to a file.
+     *
+     * @param target File to write. Parent directory will be created if necessary
+     * @param url http/https url to connect
+     * @param secsConnectTimeout Seconds to wait for connection establishment; ignored when not positive
+     * @param secsReadTimeout Read timeout in seconds - transmission will abort if it freezes more than this;
+     * ignored when not positive
+     * @return [target] if the file was saved successfully and `null` if:
+     * connection interrupted, timeout (but something was read)
+     * server error (HTTP status 400..599)
+     * could not connect: connection timeout java.net.SocketTimeoutException
+     * could not connect: java.net.ConnectException
+     * could not resolve host (bad host, or no internet - no dns)
+     * @throws IOException for any other I/O failure, e.g. if the file could not be created
+     * @throws FileNotFoundException if the connection reports that the remote file does not exist
+     */
+    @Throws(IOException::class)
+    private fun downloadUrl(
+        target: Path,
+        url: URL,
+        secsConnectTimeout: Int,
+        secsReadTimeout: Int,
+    ): Path? {
+        target.parent?.let { Files.createDirectories(it) } // make sure parent dir exists, this can throw exception
+        val conn = url.openConnection() // can throw exception if bad url
+        if (secsConnectTimeout > 0) {
+            conn.connectTimeout = secsConnectTimeout * 1000
+        }
+        if (secsReadTimeout > 0) {
+            conn.readTimeout = secsReadTimeout * 1000
+        }
+        var somethingRead = false
+        try {
+            conn.getInputStream().use { input ->
+                // Opening the output stream truncates the target, so a retry starts from a clean file.
+                Files.newOutputStream(target).use { output ->
+                    val buffer = ByteArray(8192)
+                    while (true) {
+                        val count = input.read(buffer)
+                        if (count <= 0) break
+                        somethingRead = true
+                        output.write(buffer, 0, count)
+                    }
+                }
+            }
+            return target
+        } catch (e: IOException) {
+            if (e is FileNotFoundException) {
+                // Keep the original exception as the cause so the failing URL is not lost.
+                throw FileNotFoundException("Did not found file for install").apply { initCause(e) }
+            }
+
+            val httpCode = try {
+                (conn as? HttpURLConnection)?.responseCode ?: UNKNOWN_HTTP_CODE
+            } catch (statusError: Exception) {
+                // The status is only used to classify the failure; asking for it may rethrow the same error.
+                UNKNOWN_HTTP_CODE
+            }
+
+            when {
+                somethingRead && e is SocketTimeoutException ->
+                    log.error("Read something, but connection interrupted: {}", e.message, e)
+
+                httpCode in 400..599 -> log.error("Got server error, httpcode: {}", httpCode)
+                e is SocketTimeoutException -> log.error("Connection timeout: {}", e.message, e)
+                e is ConnectException -> log.error("Could not connect: {}", e.message, e)
+                e is UnknownHostException -> log.error("Could not resolve host: {}", e.message, e)
+                else -> throw e
+            }
+            return null
+        }
+    }
+
+    /**
+     * Downloads [url] into a fresh temporary file, making up to [ATTEMPTS] attempts.
+     *
+     * @return the temporary file, or `null` if every attempt failed with a recoverable error
+     */
+    private fun downloadWithRetry(url: URL): Path? {
+        val targetPath = Files.createTempFile("pandoc", ".tmp")
+        log.info("Downloading pandoc to $targetPath")
+
+        var downloaded: Path? = null
+        try {
+            var attempt = 1
+            while (downloaded == null && attempt <= ATTEMPTS) {
+                downloaded = downloadUrl(targetPath, url, TIMEOUT_SECONDS, TIMEOUT_SECONDS)
+                if (downloaded == null) {
+                    log.warn("Download attempt {} of {} failed", attempt, ATTEMPTS)
+                }
+                attempt++
+            }
+            return downloaded
+        } finally {
+            // Do not leave an empty or partial temporary file behind when nothing usable was downloaded.
+            if (downloaded == null) {
+                Files.deleteIfExists(targetPath)
+            }
+        }
+    }
+
+    /**
+     * Unpacks the archive at [sourcePath] into [targetPath] using the archive format published for [os].
+     *
+     * @return [targetPath], or `null` if unpacking failed with an [IOException]
+     */
+    private fun unPack(sourcePath: Path, targetPath: Path, os: OSType): Path? {
+        try {
+            if (!Files.isDirectory(targetPath)) {
+                Files.createDirectories(targetPath)
+            }
+            when (os) {
+                OSType.LINUX_AMD, OSType.LINUX_ARM -> unTarGz(sourcePath, targetPath)
+                OSType.WINDOWS, OSType.MAC_OS_AMD, OSType.MAC_OS_ARM -> unZip(sourcePath, targetPath)
+            }
+        } catch (e: IOException) {
+            log.error("Could not perform unpacking: {}", e.message, e)
+            return null
+        }
+        return targetPath
+    }
+
+    /**
+     * Resolves an archive entry name against [targetDir].
+     *
+     * @throws IOException if the entry would be written outside of [targetDir] (e.g. a name containing `..`)
+     */
+    private fun resolveEntry(targetDir: Path, entryName: String): Path {
+        val root = targetDir.toAbsolutePath().normalize()
+        val resolved = root.resolve(entryName).normalize()
+        if (!resolved.startsWith(root)) {
+            throw IOException("Archive entry is outside of the target directory: $entryName")
+        }
+        return resolved
+    }
+
+    /**
+     * Copies the current archive entry from [input] to [output], creating parent directories
+     * and replacing a file left by a previous installation.
+     */
+    private fun writeEntry(input: java.io.InputStream, output: Path) {
+        output.parent?.let { Files.createDirectories(it) }
+        Files.copy(input, output, java.nio.file.StandardCopyOption.REPLACE_EXISTING)
+    }
+
+    /**
+     * Extracts the `.tar.gz` archive at [sourcePath] into [targetDir].
+     */
+    private fun unTarGz(sourcePath: Path, targetDir: Path) {
+        TarArchiveInputStream(
+            GzipCompressorInputStream(
+                BufferedInputStream(Files.newInputStream(sourcePath))
+            )
+        ).use { tarIn ->
+            while (true) {
+                // nextEntry is null once the end of the archive is reached
+                val entry: ArchiveEntry = tarIn.nextEntry ?: break
+                val entryOutput = resolveEntry(targetDir, entry.name)
+                if (entry.isDirectory) {
+                    Files.createDirectories(entryOutput)
+                } else {
+                    writeEntry(tarIn, entryOutput)
+                }
+            }
+        }
+    }
+
+    /**
+     * Extracts the `.zip` archive at [sourcePath] into [targetDir].
+     */
+    private fun unZip(sourcePath: Path, targetDir: Path) {
+        ZipInputStream(sourcePath.inputStream()).use { zis ->
+            while (true) {
+                // nextEntry is null once the end of the archive is reached
+                val entry = zis.nextEntry ?: break
+                val entryOutput = resolveEntry(targetDir, entry.name)
+                if (entry.isDirectory) {
+                    Files.createDirectories(entryOutput)
+                } else {
+                    writeEntry(zis, entryOutput)
+                }
+                zis.closeEntry()
+            }
+        }
+    }
+
+    /**
+     * Requests the description of the latest pandoc release from the `github.url` endpoint.
+     *
+     * @throws IOException if the request fails or github answers with a status other than 200
+     */
+    private fun getGithubUrls(): ResponseDto {
+        val githubUrl = checkNotNull(properties.getProperty("github.url")) {
+            "Property github.url is not defined in installer.properties"
+        }
+        val client = HttpClient.newHttpClient()
+        val request = HttpRequest
+            .newBuilder()
+            .uri(URI.create(githubUrl))
+            .version(HttpClient.Version.HTTP_2)
+            .timeout(Duration.ofMinutes(1))
+            .header("Accept", "application/vnd.github+json")
+            .GET()
+            .build()
+
+        val response = client.send(request, HttpResponse.BodyHandlers.ofString())
+        log.info("Got response from github, status: {}", response.statusCode())
+
+        // An error body (e.g. when the API rate limit is exceeded) does not describe a release;
+        // fail with the status instead of an obscure deserialization error.
+        if (response.statusCode() != 200) {
+            throw IOException("Could not get the latest pandoc release from github, status: ${response.statusCode()}")
+        }
+
+        return Json { ignoreUnknownKeys = true }.decodeFromString(ResponseDto.serializer(), response.body())
+    }
+}
diff --git a/snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/ResponseDto.kt b/snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/ResponseDto.kt
new file mode 100644
index 0000000..23e16fd
--- /dev/null
+++ b/snark-pandoc/src/jvmMain/kotlin/space/kscience/snark/pandoc/ResponseDto.kt
@@ -0,0 +1,34 @@
+package space.kscience.snark.pandoc
+
+import kotlinx.serialization.SerialName
+import kotlinx.serialization.Serializable
+
+/**
+ * Response from github/releases/latest
+ *
+ * @property assets files attached to the release
+ * @property tagName value of the `tag_name` field of the release
+ */
+@Serializable
+internal class ResponseDto(
+    val assets: Array<AssetDto>,
+    @SerialName("tag_name") val tagName: String,
+) {
+    /**
+     * Finds the first asset whose name contains [osSuffix].
+     *
+     * @param osSuffix substring of the asset name that identifies the target platform; must not be null
+     * @return asset appropriate to os
+     * @throws IllegalArgumentException if [osSuffix] is null or no asset name contains it
+     */
+    fun getAssetByOsSuffix(osSuffix: String?): AssetDto {
+        // Validate once up front so that a null suffix fails the same way whether or not assets is empty.
+        val suffix = requireNotNull(osSuffix) { "osSuffix must not be null" }
+        return assets.firstOrNull { asset -> suffix in asset.name }
+            ?: throw IllegalArgumentException("Unexpected osSuffix: no release asset name contains '$suffix'")
+    }
+
+
+    /**
+     * Single downloadable file of a release.
+     *
+     * @property browserDownloadUrl value of the `browser_download_url` field
+     * @property name file name of the asset
+     */
+    @Serializable
+    public class AssetDto(
+        @SerialName("browser_download_url") val browserDownloadUrl: String,
+        val name: String
+    )
+
+}
diff --git a/snark-pandoc/src/jvmMain/resources/installer.properties b/snark-pandoc/src/jvmMain/resources/installer.properties
new file mode 100644
index 0000000..e20b7d5
--- /dev/null
+++ b/snark-pandoc/src/jvmMain/resources/installer.properties
@@ -0,0 +1,8 @@
+path.to.pandoc.mac.os.arm=/pandoc-{version}-arm64/bin/pandoc
+path.to.pandoc.mac.os.amd=/pandoc-{version}-x86_64/bin/pandoc
+path.to.pandoc.windows=/pandoc-{version}/pandoc.exe
+path.to.pandoc.linux.amd=/pandoc-{version}/bin/pandoc
+path.to.pandoc.linux.arm=/pandoc-{version}/bin/pandoc
+
+github.url=https://api.github.com/repos/jgm/pandoc/releases/latest
+
diff --git a/snark-pandoc/src/jvmTest/kotlin/PandocTest.kt b/snark-pandoc/src/jvmTest/kotlin/PandocTest.kt
new file mode 100644
index 0000000..f61b0d9
--- /dev/null
+++ b/snark-pandoc/src/jvmTest/kotlin/PandocTest.kt
@@ -0,0 +1,111 @@
+import org.junit.jupiter.api.Assertions.*
+import org.junit.jupiter.api.Test
+import space.kscience.snark.pandoc.Pandoc
+import java.io.BufferedReader
+import java.io.FileReader
+import java.io.IOException
+import java.nio.file.Files
+import java.nio.file.Path
+import java.util.stream.Collectors
+import kotlin.io.path.Path
+import kotlin.io.path.createDirectories
+import kotlin.io.path.div
+
+/**
+ * Tests of [Pandoc.execute] against the fixtures in `testing_directory`.
+ *
+ * Files produced by a test are removed in `finally` blocks so that a failed assertion does not leave
+ * artifacts behind for the next run.
+ */
+class PandocTest {
+    @Test
+    fun when_gotPandocAndCorrectArgs_doConverting() {
+        try {
+            val res = Pandoc.execute {
+                addInputFile(CORRECT_MD)
+                outputFile(TEX_PATH_TO)
+            }
+            assertTrue(res)
+            assertTrue(Files.exists(TEX_PATH_TO))
+
+            val fileString = Files.readString(TEX_PATH_TO)
+
+            assertTrue(fileString.contains("Some simple text"))
+            assertTrue(fileString.contains("\\subsection{Copy elision}"))
+            assertTrue(fileString.contains("return"))
+        } finally {
+            Files.deleteIfExists(TEX_PATH_TO)
+        }
+    }
+
+    @Test
+    fun when_gotPandocAndNotExistsFromFile_then_error() {
+        val notExistsFile = Path.of("./src/test/testing_directory/non_exists_test.md")
+        assertFalse(Files.exists(notExistsFile))
+        val res = Pandoc.execute {
+            addInputFile(notExistsFile)
+            outputFile(TEX_PATH_TO)
+        }
+        assertFalse(res)
+    }
+
+    @Test
+    fun when_gotPandocAndPassDirectory_then_error() {
+        assertTrue(Files.isDirectory(TESTING_DIRECTORY))
+
+        val res = Pandoc.execute {
+            addInputFile(TESTING_DIRECTORY)
+            outputFile(TEX_PATH_TO)
+        }
+
+        assertFalse(res)
+    }
+
+    @Test
+    fun when_askVersionToFile_then_Ok() {
+        val outputFile = TESTING_DIRECTORY / "output.txt"
+
+        try {
+            val res = Pandoc.execute(redirectOutput = outputFile) {
+                getVersion()
+            }
+
+            val fileString = Files.readString(outputFile)
+            assertTrue(fileString.contains("pandoc"))
+            assertTrue(fileString.contains("This is free software"))
+            assertTrue(res)
+        } finally {
+            Files.deleteIfExists(outputFile)
+        }
+    }
+
+    @Test
+    fun when_error_then_writeToErrorStream() {
+        val outputFile = Files.createTempFile(TESTING_DIRECTORY, "output", ".txt")
+        val errorFile = Files.createTempFile(TESTING_DIRECTORY, "error", ".txt")
+
+        try {
+            val res = Pandoc.execute(outputFile, errorFile) {
+                // Use the committed fixture so that the failure is caused by the unknown input format
+                // and not by a missing input file.
+                addInputFile(TESTING_DIRECTORY / "simple.txt")
+                outputFile(TEX_PATH_TO)
+                formatFrom("txt")
+            }
+
+            val fileString = Files.readString(errorFile)
+            assertFalse(res)
+            assertTrue(fileString.contains("21"))
+        } finally {
+            Files.deleteIfExists(outputFile)
+            Files.deleteIfExists(errorFile)
+        }
+    }
+
+
+//    @Test
+//    fun when_installPandoc_thenFindIt() {
+//        PandocInstaller.clearInstallingDirectory()
+//        assertTrue(Pandoc.installPandoc())
+//        assertTrue(Pandoc.isPandocInstalled())
+//    }
+
+    companion object {
+        /** Directory with the test fixtures; it also receives the files generated by the tests. */
+        private val TESTING_DIRECTORY: Path = Path("./testing_directory").apply {
+            createDirectories()
+        }
+        private val CORRECT_MD: Path = TESTING_DIRECTORY.resolve("first_test.md")
+        private val TEX_PATH_TO: Path = TESTING_DIRECTORY.resolve("output1.tex")
+    }
+}
diff --git a/snark-pandoc/testing_directory/first_test.md b/snark-pandoc/testing_directory/first_test.md
new file mode 100644
index 0000000..e12d918
--- /dev/null
+++ b/snark-pandoc/testing_directory/first_test.md
@@ -0,0 +1,15 @@
+
+
+## Copy elision
+### RVO/NRVO
+Some simple text
+```c++
+A f() {
+    return {5};
+}
+
+A g() {
+    A a(5);
+    return a;
+}
+```
\ No newline at end of file
diff --git a/snark-pandoc/testing_directory/simple.txt b/snark-pandoc/testing_directory/simple.txt
new file mode 100644
index 0000000..b6fc4c6
--- /dev/null
+++ b/snark-pandoc/testing_directory/simple.txt
@@ -0,0 +1 @@
+hello
\ No newline at end of file