1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105 | package Torello.HTML.NodeSearch.SearchLoops.TagNodesInclusive;
import java.util.Vector;
import java.util.stream.IntStream;
import Torello.HTML.*;
import Torello.HTML.NodeSearch.InclusiveException;
import Torello.Java.LV;
/**
 * Search loops that locate "inclusive" tag matches (an opening tag for which
 * {@code Util.Inclusive.dotPairOPT} yields a non-null {@code DotPair}) inside a
 * sub-range of an HTML vector, and remove the matched range(s) from that vector.
 *
 * <p>All methods modify the {@code html} vector passed to them in place.</p>
 */
public class TNRemoveIncl
{
    /**
     * Removes the nth inclusive match, counting forward from {@code l.start}.
     *
     * @param html     the vector to search; the matched range is deleted from it
     * @param nth      1-based ordinal of the match to remove
     * @param l        loop bounds; indices {@code l.start} (inclusive) up to
     *                 {@code l.end} (exclusive) are visited
     * @param htmlTags tag names handed to {@code TagNode.isTag} and first passed
     *                 to {@code InclusiveException.check}
     * @return {@code size()} of the removed {@code DotPair}, or {@code 0} when the
     *         loop ends without reaching an nth match
     */
    public static int nth (Vector<? extends HTMLNode> html, int nth, LV l, String... htmlTags)
    {
        InclusiveException.check(htmlTags);

        int remaining = nth;

        for (int pos = l.start; pos < l.end; pos++)
        {
            DotPair span = inclusiveSpanAt(html, pos, l, false, htmlTags);

            if (span == null) continue;

            // Only successful inclusive matches count toward the ordinal.
            if (--remaining != 0) continue;

            return removeSpan(html, span);
        }

        return 0;
    }

    /**
     * Removes the nth inclusive match, counting backward from {@code l.end - 1}
     * down to {@code l.start}.
     *
     * @param html     the vector to search; the matched range is deleted from it
     * @param nth      1-based ordinal of the match to remove, counted from the end
     * @param l        loop bounds; indices {@code l.end - 1} down to
     *                 {@code l.start} are visited
     * @param htmlTags tag names handed to {@code TagNode.isTag} and first passed
     *                 to {@code InclusiveException.check}
     * @return {@code size()} of the removed {@code DotPair}, or {@code 0} when the
     *         loop ends without reaching an nth match
     */
    public static int nthFromEnd
        (Vector<? extends HTMLNode> html, int nth, LV l, String... htmlTags)
    {
        InclusiveException.check(htmlTags);

        int remaining = nth;

        for (int pos = l.end - 1; pos >= l.start; pos--)
        {
            DotPair span = inclusiveSpanAt(html, pos, l, false, htmlTags);

            if (span == null) continue;

            // Only successful inclusive matches count toward the ordinal.
            if (--remaining != 0) continue;

            return removeSpan(html, span);
        }

        return 0;
    }

    /**
     * Removes every inclusive match whose opening tag satisfies
     * {@code isTag(TC.OpeningTags, htmlTags)} within the loop bounds.
     *
     * @param html     the vector to search and to remove nodes from
     * @param l        loop bounds; indices {@code l.start} (inclusive) up to
     *                 {@code l.end} (exclusive) are visited
     * @param htmlTags tag names handed to {@code TagNode.isTag} and first passed
     *                 to {@code InclusiveException.check}
     * @return the length of the position array built by {@code DPUtil.toPosArray}
     *         (presumably the number of nodes removed - confirm against DPUtil)
     */
    public static int all (Vector<? extends HTMLNode> html, LV l, String... htmlTags)
    {
        InclusiveException.check(htmlTags);

        Vector<DotPair> found = new Vector<>();

        for (int pos = l.start; pos < l.end; pos++)
        {
            DotPair span = inclusiveSpanAt(html, pos, l, false, htmlTags);

            if (span != null) found.addElement(span);
        }

        return removeCollected(html, found);
    }

    /**
     * Removes every inclusive match whose opening tag satisfies
     * {@code isTagExcept(TC.OpeningTags, htmlTags)} within the loop bounds.
     *
     * @param html     the vector to search and to remove nodes from
     * @param l        loop bounds; indices {@code l.start} (inclusive) up to
     *                 {@code l.end} (exclusive) are visited
     * @param htmlTags tag names handed to {@code TagNode.isTagExcept} and first
     *                 passed to {@code InclusiveException.check}
     * @return the length of the position array built by {@code DPUtil.toPosArray}
     *         (presumably the number of nodes removed - confirm against DPUtil)
     */
    public static int allExcept (Vector<? extends HTMLNode> html, LV l, String... htmlTags)
    {
        InclusiveException.check(htmlTags);

        Vector<DotPair> found = new Vector<>();

        for (int pos = l.start; pos < l.end; pos++)
        {
            DotPair span = inclusiveSpanAt(html, pos, l, true, htmlTags);

            if (span != null) found.addElement(span);
        }

        return removeCollected(html, found);
    }

    // Returns the DotPair reported by dotPairOPT for the node at 'pos' when that node is
    // a TagNode passing the opening-tag test ('except' selects isTagExcept over isTag);
    // returns null when any of those checks fails or dotPairOPT itself returns null.
    private static DotPair inclusiveSpanAt
        (Vector<? extends HTMLNode> html, int pos, LV l, boolean except, String[] htmlTags)
    {
        HTMLNode node = html.elementAt(pos);

        if (! node.isTagNode()) return null;

        TagNode tag = (TagNode) node;

        boolean accepted = except
            ? tag.isTagExcept(TC.OpeningTags, htmlTags)
            : tag.isTag(TC.OpeningTags, htmlTags);

        if (! accepted) return null;

        return Util.Inclusive.dotPairOPT(html, pos, l.end);
    }

    // Deletes indices span.start through span.end (both included) from 'html' and
    // returns span.size().
    private static int removeSpan (Vector<? extends HTMLNode> html, DotPair span)
    {
        html.subList(span.start, span.end + 1).clear();

        return span.size();
    }

    // Converts the collected DotPairs to a position array, removes those positions
    // from 'html', and returns the array's length.
    private static int removeCollected (Vector<? extends HTMLNode> html, Vector<DotPair> found)
    {
        int[] positions = DPUtil.toPosArray(found, true);

        Util.Remove.nodesOPT(html, positions);

        return positions.length;
    }
}
|