-
Notifications
You must be signed in to change notification settings - Fork 271
/
DocxConverterPegdown.java
108 lines (97 loc) · 4.32 KB
/
DocxConverterPegdown.java
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
package com.vladsch.flexmark.java.samples;
import com.vladsch.flexmark.docx.converter.DocxRenderer;
import com.vladsch.flexmark.parser.Parser;
import com.vladsch.flexmark.profile.pegdown.Extensions;
import com.vladsch.flexmark.profile.pegdown.PegdownOptionsAdapter;
import com.vladsch.flexmark.util.ast.Node;
import com.vladsch.flexmark.util.data.DataHolder;
import org.apache.commons.io.IOUtils;
import org.docx4j.Docx4J;
import org.docx4j.openpackaging.exceptions.Docx4JException;
import org.docx4j.openpackaging.packages.WordprocessingMLPackage;
import java.io.File;
import java.io.IOException;
import java.io.InputStream;
import java.io.StringWriter;
public class DocxConverterPegdown {
// don't need to use pegdown options adapter. You can setup the options as you like. I find this is a quick way to add all the fixings
static final DataHolder OPTIONS = PegdownOptionsAdapter.flexmarkOptions(
Extensions.ALL & ~(Extensions.ANCHORLINKS | Extensions.EXTANCHORLINKS_WRAP))
.toMutable()
.set(DocxRenderer.SUPPRESS_HTML, true)
// the DocxLinkResolver is added automatically, or alternately set it to false and add your own link resolver
//.set(DocxRenderer.DEFAULT_LINK_RESOLVER, true)
.set(DocxRenderer.DOC_RELATIVE_URL, "file:///Users/vlad/src/pdf") // this will be used for URLs like 'images/...' or './' or '../'
.set(DocxRenderer.DOC_ROOT_URL, "file:///Users/vlad/src/pdf") // this will be used for URLs like: '/...'
.toImmutable();
static String getResourceFileContent(String resourcePath) {
StringWriter writer = new StringWriter();
getResourceFileContent(writer, resourcePath);
return writer.toString();
}
private static void getResourceFileContent(StringWriter writer, String resourcePath) {
InputStream inputStream = DocxConverterPegdown.class.getResourceAsStream(resourcePath);
try {
IOUtils.copy(inputStream, writer, "UTF-8");
inputStream.close();
} catch (IOException e) {
e.printStackTrace();
}
}
public static void main(String[] args) {
String markdown = "#Heading\n" +
"-----\n" +
"paragraph text \n" +
"lazy continuation\n" +
"\n" +
"* list item\n" +
" > block quote\n" +
" lazy continuation\n" +
"\n" +
"~~~info\n" +
" with uneven indent\n" +
" with uneven indent\n" +
"indented code\n" +
"~~~ \n" +
"\n" +
" with uneven indent\n" +
" with uneven indent\n" +
" indented code\n" +
"1. numbered item 1 \n" +
"1. numbered item 2 \n" +
"1. numbered item 3 \n" +
" - bullet item 1 \n" +
" - bullet item 2 \n" +
" - bullet item 3 \n" +
" 1. numbered sub-item 1 \n" +
" 1. numbered sub-item 2 \n" +
" 1. numbered sub-item 3 \n" +
" \n" +
" ~~~info\n" +
" with uneven indent\n" +
" with uneven indent\n" +
" indented code\n" +
" ~~~ \n" +
" \n" +
" with uneven indent\n" +
" with uneven indent\n" +
" indented code\n" +
"";
System.out.println("markdown\n");
System.out.println(markdown);
Parser PARSER = Parser.builder(OPTIONS).build();
DocxRenderer RENDERER = DocxRenderer.builder(OPTIONS).build();
Node document = PARSER.parse(markdown);
// to get XML
String xml = RENDERER.render(document);
// or to control the package
WordprocessingMLPackage template = DocxRenderer.getDefaultTemplate();
RENDERER.render(document, template);
File file = new File("/Users/vlad/src/pdf/flexmark-java.docx");
try {
template.save(file, Docx4J.FLAG_SAVE_ZIP_FILE);
} catch (Docx4JException e) {
e.printStackTrace();
}
}
}