2 * Copyright 2005 the original author or authors.
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
8 * http://www.apache.org/licenses/LICENSE-2.0
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
17 package org.wamblee.crawler;
19 import org.apache.commons.httpclient.NameValuePair;
23 * The object that actually obtains pages based on URL.
25 public interface Crawler {
28 * Gets the content for a specific page.
29 * @param aUrl Url of page.
30 * @param aParameters Parameters to supply.
31 * @return The retrieved page.
32 * @throws PageException In case of problems retrieving the page.
// Two-argument overload: takes no PageType argument.
34 Page getPage(String aUrl, NameValuePair[] aParameters) throws PageException;
37 * Gets the content for a specific page.
38 * @param aUrl Url of page.
39 * @param aParameters Parameters to supply.
40 * @param aType Type of page.
41 * @return The retrieved page.
42 * @throws PageException In case of problems retrieving the page.
// Three-argument overload: additionally takes the page type (aType).
44 Page getPage(String aUrl, NameValuePair[] aParameters, PageType aType) throws PageException;