testvisitlinkedpages.java

来自「用来为垂直搜索引擎抓取数据的采集系统」· Java 代码 · 共 43 行

JAVA
43
字号
/*
 * *****************************************************
 * Copyright (c) 2005 IIM Lab. All Rights Reserved.
 * Created by xuehao at 2005-10-12
 * Contact: zxuehao@mail.ustc.edu.cn
 * *****************************************************
 */

package org.indigo.tests.pages;

import java.util.ArrayList;
import java.util.HashSet;

import org.indigo.pages.VisitLinkedPages;

import junit.framework.TestCase;

/**
 * Smoke test that drives {@link VisitLinkedPages} over a fixed set of
 * listing URLs and prints every link it hands back.
 *
 * The test contains no assertions: it passes as long as the calls complete
 * without throwing, and its output has to be inspected by hand.
 */
public class TestVisitLinkedPages extends TestCase
{

    /** Listing URLs handed to the visitor, in the order they are added. */
    private static final String[] SEED_URLS = {
        "http://www.ahnw.gov.cn/scxx/schq/index.asp?datetime=&page=1&zl=80%CB%AE%B9%FB&diqu=&chanpin=&dl=01%C5%A9%B8%B1&NewDay=0",
        "http://www.ahnw.gov.cn/scxx/schq/index.asp?datetime=&page=1&zl=30%CA%DF%B2%CB&diqu=&chanpin=&dl=01%C5%A9%B8%B1&NewDay=0",
        "http://www.ahnw.gov.cn/scxx/schq/index.asp?datetime=&page=1&zl=70%CB%AE%B2%FA%C6%B7&diqu=&chanpin=&dl=01%C5%A9%B8%B1&NewDay=0"
    };

    /**
     * Configures a visitor with the seed URLs and the parameters (1, 3, 1),
     * then writes each link returned by getNextVisitLink() to standard
     * output until the visitor returns null.
     */
    public void testVisitLinkedPages()
    {
        // Appending to an empty list yields the same positions 0, 1, 2.
        ArrayList seedUrls = new ArrayList();
        for( int i = 0; i < SEED_URLS.length; i++ )
        {
            seedUrls.add( SEED_URLS[i] );
        }

        // "page" presumably names the query parameter that is varied
        // between visits - TODO confirm against VisitLinkedPages.
        VisitLinkedPages visitor = new VisitLinkedPages( "page" );
        visitor.setLinkedUrls( seedUrls );
        // NOTE(review): the three values look like first page, last page
        // and step - confirm against VisitLinkedPages.setParameters.
        visitor.setParameters( 1, 3, 1 );

        // A null return marks the end of the sequence.
        for( String link = visitor.getNextVisitLink(); link != null; link = visitor.getNextVisitLink() )
        {
            System.out.println( link );
        }
    }
}

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?