(no commit message)
[utils] / crawler / kiss / src / org / wamblee / crawler / kiss / ProgramConfigurationParser.java
index 71719799c2162296902da68e8f6c7612382fc5b0..2c05b827233a82888c34be1452ef07e8ed5ff269 100644 (file)
@@ -21,21 +21,28 @@ import java.util.ArrayList;
 import java.util.Iterator;
 import java.util.List;
 
+import org.dom4j.Attribute;
 import org.dom4j.Document;
 import org.dom4j.DocumentException;
 import org.dom4j.Element;
 import org.dom4j.io.SAXReader;
+import org.wamblee.conditions.AndCondition;
 import org.wamblee.conditions.Condition;
-import org.wamblee.conditions.OrCondition;
+import org.wamblee.conditions.PropertyRegexCondition;
+import org.wamblee.crawler.kiss.ProgramFilter.ProgramAction;
 
 /**
  * Parse the configuration of desired programs.
  */
-public class ProgramConfigurationParser {
-    
-    
+class ProgramConfigurationParser {
+
     private static final String ELEM_PROGRAM = "program";
-    private static final String ELEM_PATTERN = "name";
+
+    private static final String ELEM_PATTERN = "match";
+
+    private static final String ELEM_ACTION = "action";
+
+    private static final String ACTION_NOTIFY = "notify";
 
     /**
      * Parses the condition used to match the desired programs.
@@ -44,20 +51,41 @@ public class ProgramConfigurationParser {
      *            Input stream to parse from.
      * @return Condition.
      */
-    Condition<Program> parse(InputStream aStream) {
+    List<ProgramFilter> parse(InputStream aStream) {
+        List<ProgramFilter> filters = new ArrayList<ProgramFilter>();
         try {
             SAXReader reader = new SAXReader();
             Document document = reader.read(aStream);
 
             Element root = document.getRootElement();
-            List<Condition<Program>> conditions = new ArrayList<Condition<Program>>();
 
-            for (Iterator i = root.elementIterator(ELEM_PROGRAM); i.hasNext(); ) {
-                Element program = (Element)i.next();
-                String pattern = ".*" + program.element(ELEM_PATTERN).getText() + ".*";
-                conditions.add(new ProgramNameMatcher(pattern)); 
+            for (Iterator i = root.elementIterator(ELEM_PROGRAM); i.hasNext();) {
+                Element program = (Element) i.next();
+
+                Element actionElem = program.element(ELEM_ACTION);
+                ProgramAction action = ProgramAction.RECORD;
+                if (actionElem != null) {
+                    if (actionElem.getText().equals(ACTION_NOTIFY)) {
+                        action = ProgramAction.NOTIFY;
+                    }
+                }
+                List<Condition<Program>> regexConditions = 
+                    new ArrayList<Condition<Program>>();
+                for (Iterator j = program.elementIterator(ELEM_PATTERN); j.hasNext(); ) {
+                    Element patternElem = (Element)j.next();
+                    String fieldName = "name"; 
+                    Attribute fieldAttribute = patternElem.attribute("field"); 
+                    if ( fieldAttribute != null ) { 
+                        fieldName = fieldAttribute.getText(); 
+                    }
+                    String pattern = ".*(" + patternElem.getText()
+                    + ").*";
+                    regexConditions.add(new PropertyRegexCondition<Program>(fieldName, pattern, true));
+                }
+                Condition<Program> condition = new AndCondition<Program>(regexConditions);
+                filters.add(new ProgramFilter(condition, action));
             }
-            return new OrCondition<Program>(conditions);
+            return filters;
         } catch (DocumentException e) {
             throw new RuntimeException("Error parsing program configuraiton", e);
         }