1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
|
package model.html;
import model.html.ElementNode;
import model.html.HtmlParser;
import model.html.TextNode;
import model.util.Node;
import org.javatuples.Pair;
import org.junit.jupiter.api.Test;
import java.util.*;
import static org.junit.jupiter.api.Assertions.*;
/**
 * Tests for {@link HtmlParser#parseHtml}: each test parses a fixture string and compares the
 * resulting node tree against a hand-built expected tree.
 */
public class HtmlParserTest {
    final String idiomaticHtml = "<!DOCTYPE html><html><head></head><body><p>Hello, world!</p></body></html>";
    final String brokenHtml = "<html><foo><bar></bar><><ba";
    final String trailingTextHtml = "bot<html><foo><bar></bar>ba";
    final String attributesHtml = "<html><attr hello=\"world\" foo='bar' strange=\"cha\\\"rm\" up='do\\'wn'></attr></html>";

    /**
     * A well-formed document: the doctype is expected to produce no node, and the text ends up
     * as the only child of {@code <p>}.
     */
    @Test
    void testIdiomaticHtml() {
        // Expected trees are built bottom-up so they do not depend on ElementNode keeping a
        // reference to a list that is filled in after construction.
        ArrayList<Node> paragraphChildren = new ArrayList<>();
        paragraphChildren.add(new TextNode("Hello, world!"));

        ArrayList<Node> bodyChildren = new ArrayList<>();
        bodyChildren.add(new ElementNode("p", new ArrayList<>(), paragraphChildren));

        ArrayList<Node> htmlChildren = new ArrayList<>();
        htmlChildren.add(new ElementNode("head"));
        htmlChildren.add(new ElementNode("body", new ArrayList<>(), bodyChildren));

        ArrayList<Node> expected = new ArrayList<>();
        expected.add(new ElementNode("html", new ArrayList<>(), htmlChildren));

        HtmlParser parser = new HtmlParser();
        assertEqualsHtml(parser.parseHtml(idiomaticHtml), expected);
    }

    /**
     * Malformed input with unclosed elements: {@code <>} is expected to survive as text inside
     * {@code <foo>}, and the dangling {@code <ba} is expected to produce no node.
     */
    @Test
    void testBrokenHtml() {
        ArrayList<Node> fooChildren = new ArrayList<>();
        fooChildren.add(new ElementNode("bar", new ArrayList<>()));
        fooChildren.add(new TextNode("<>"));

        ArrayList<Node> htmlChildren = new ArrayList<>();
        htmlChildren.add(new ElementNode("foo", new ArrayList<>(), fooChildren));

        ArrayList<Node> expected = new ArrayList<>();
        expected.add(new ElementNode("html", new ArrayList<>(), htmlChildren));

        HtmlParser parser = new HtmlParser();
        assertEqualsHtml(parser.parseHtml(brokenHtml), expected);
    }

    /**
     * Text before and after the markup: both runs of text are expected as top-level text nodes
     * next to the {@code <html>} element.
     */
    @Test
    void testTrailingTextHtml() {
        ArrayList<Node> fooChildren = new ArrayList<>();
        fooChildren.add(new ElementNode("bar", new ArrayList<>()));

        ArrayList<Node> htmlChildren = new ArrayList<>();
        htmlChildren.add(new ElementNode("foo", new ArrayList<>(), fooChildren));

        ArrayList<Node> expected = new ArrayList<>();
        expected.add(new TextNode("bot"));
        expected.add(new ElementNode("html", new ArrayList<>(), htmlChildren));
        expected.add(new TextNode("ba"));

        HtmlParser parser = new HtmlParser();
        assertEqualsHtml(parser.parseHtml(trailingTextHtml), expected);
    }

    /**
     * An element with double-quoted, single-quoted and backslash-escaped attribute values.
     */
    @Test
    void testAttributesHtml() {
        ArrayList<Pair<String, String>> expectedAttributes = new ArrayList<>();
        expectedAttributes.add(new Pair<>("hello", "world"));
        expectedAttributes.add(new Pair<>("foo", "bar"));
        expectedAttributes.add(new Pair<>("strange", "cha\"rm"));
        expectedAttributes.add(new Pair<>("up", "do'wn"));

        ArrayList<Node> htmlChildren = new ArrayList<>();
        htmlChildren.add(new ElementNode("attr", expectedAttributes));

        ArrayList<Node> expected = new ArrayList<>();
        expected.add(new ElementNode("html", new ArrayList<>(), htmlChildren));

        HtmlParser parser = new HtmlParser();
        ArrayList<Node> parsed = parser.parseHtml(attributesHtml);
        displayHtmlTree(parsed);
        assertEqualsHtml(parsed, expected);
    }

    /**
     * Recursively asserts that two node trees match.
     *
     * <p>At every level the number of nodes must be equal; for each position the nodes must
     * report equal {@code getData()} values and must agree on whether they are an
     * {@link ElementNode}. Children of element nodes are compared the same way. A {@code null}
     * list is treated as an empty one.
     *
     * <p>NOTE(review): attributes are not compared here, so unless {@code getData()} already
     * reflects them, {@code testAttributesHtml} does not verify the parsed attribute values.
     *
     * @param html     the tree produced by the parser (actual)
     * @param expected the hand-built tree to compare against
     */
    private static void assertEqualsHtml(ArrayList<Node> html, ArrayList<Node> expected) {
        int actualSize = html == null ? 0 : html.size();
        int expectedSize = expected == null ? 0 : expected.size();
        // Without this check a parser returning too few nodes (or none) would pass vacuously.
        assertEquals(expectedSize, actualSize, "number of nodes at this level");

        for (int i = 0; i < expectedSize; i++) {
            Node actualNode = html.get(i);
            Node expectedNode = expected.get(i);
            assertEquals(expectedNode.getData(), actualNode.getData(), "data of node " + i);

            if (actualNode instanceof ElementNode) {
                // Fail with a readable message instead of a ClassCastException below.
                assertTrue(expectedNode instanceof ElementNode,
                        "node " + i + " is an element but a non-element was expected");
                assertEqualsHtml(((ElementNode) actualNode).getChildren(),
                        ((ElementNode) expectedNode).getChildren());
            } else {
                assertFalse(expectedNode instanceof ElementNode,
                        "node " + i + " is not an element but an element was expected");
            }
        }
    }

    /**
     * Simple helper function for debugging.
     * EFFECTS: prints a representation of the tree to the console for debugging purposes.
     * Each element is printed as its tag followed by the data of its direct children, then its
     * children are printed recursively; any other node is printed as "Text: " plus its data.
     */
    private void displayHtmlTree(ArrayList<Node> tree) {
        for (Node node : tree) {
            if (node instanceof ElementNode) {
                ElementNode element = (ElementNode) node;
                System.out.print(element.getTag() + ": ");
                for (Node child : element.getChildren()) {
                    System.out.print(child.getData() + " ");
                }
                System.out.println();
                displayHtmlTree(element.getChildren());
            } else {
                System.out.println("Text: " + node.getData());
            }
        }
    }
}
|