2 * Copyright 2005 the original author or authors.
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
8 * http://www.apache.org/licenses/LICENSE-2.0
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
17 package org.wamblee.crawler.kiss.main;
19 import java.io.InputStream;
20 import java.util.ArrayList;
21 import java.util.Iterator;
22 import java.util.List;
24 import org.dom4j.Attribute;
25 import org.dom4j.Document;
26 import org.dom4j.DocumentException;
27 import org.dom4j.Element;
28 import org.dom4j.io.SAXReader;
29 import org.wamblee.conditions.AndCondition;
30 import org.wamblee.conditions.Condition;
31 import org.wamblee.conditions.PropertyRegexCondition;
32 import org.wamblee.crawler.kiss.guide.Program;
33 import org.wamblee.xml.XslTransformer;
36 * Parse the configuration of desired programs.
38 class ProgramConfigurationParser {
39 private static final int DEFAULT_SMTP_PORT = 25;
41 private static final int DEFAULT_PRIORITY = 1;
43 // Formatting configuration.
44 private static final String ELEM_FORMAT = "format";
46 private static final String ELEM_TEXT = "text";
48 private static final String ELEM_HTML = "html";
50 // Configuration of interesting programs.
52 private static final String ELEM_PROGRAM = "program";
54 private static final String ELEM_PRIORITY = "priority";
56 private static final String ELEM_PATTERN = "match";
58 private static final String ELEM_ACTION = "action";
60 private static final String ELEM_CATEGORY = "category";
62 private static final String ACTION_NOTIFY = "notify";
64 private List<ProgramFilter> _filters;
66 private XslTransformer _transformer;
68 ProgramConfigurationParser(XslTransformer aTransformer) {
70 _transformer = aTransformer;
74 * Parses the condition used to match the desired programs.
77 * Input stream to parse from.
80 void parse(InputStream aStream) {
81 List<ProgramFilter> filters = new ArrayList<ProgramFilter>();
83 SAXReader reader = new SAXReader();
84 Document document = reader.read(aStream);
86 Element root = document.getRootElement();
88 for (Iterator i = root.elementIterator(ELEM_PROGRAM); i.hasNext();) {
89 Element program = (Element) i.next();
91 Element categoryElem = program.element(ELEM_CATEGORY);
93 if (categoryElem != null) {
94 category = categoryElem.getText().trim();
97 Element actionElem = program.element(ELEM_ACTION);
98 int priority = DEFAULT_PRIORITY;
99 String priorityString = program.elementTextTrim(ELEM_PRIORITY);
100 if ( priorityString != null ) {
101 priority = Integer.valueOf(priorityString);
103 ProgramAction action = new RecordProgramAction(priority);
104 if (actionElem != null) {
105 if (actionElem.getText().equals(ACTION_NOTIFY)) {
106 action = new InterestingProgramAction(category);
110 List<Condition<Program>> regexConditions = new ArrayList<Condition<Program>>();
111 for (Iterator j = program.elementIterator(ELEM_PATTERN); j
113 Element patternElem = (Element) j.next();
114 String fieldName = "name";
115 Attribute fieldAttribute = patternElem.attribute("field");
116 if (fieldAttribute != null) {
117 fieldName = fieldAttribute.getText();
119 String pattern = ".*(" + patternElem.getText() + ").*";
120 regexConditions.add(new PropertyRegexCondition<Program>(
121 fieldName, pattern, true));
123 Condition<Program> condition = new AndCondition<Program>(
125 filters.add(new ProgramFilter(condition, action));
128 } catch (DocumentException e) {
129 throw new RuntimeException("Error parsing program configuraiton", e);
134 * Returns the list of program filters.
136 * @return Filter list.
138 public List<ProgramFilter> getFilters() {