robots.h
来自「网络爬虫程序」· C头文件 代码 · 共 29 行
H
29 行
/***************************************************************************//* This code is part of WWW grabber called pavuk *//* Copyright (c) 1997 - 2001 Stefan Ondrejicka *//* Distributed under GPL 2 or later *//***************************************************************************/#ifndef _robots_h_#define _robots_h_#include "tools.h"#include "mt.h"#include "url.h"typedef struct{ char *site; /*** host name of server for "robots.txt" checking ***/ int port; /*** server port ***/ char **dpat; /*** list of disallowed prefixes ***/ char **apat; /*** list of allowed prefixes */#ifdef HAVE_MT pthread_mutex_t lock; /*** lock to prevent downloading concurrently with multiple threads ***/#endif} robotlim;extern bool_t robots_check(url *);extern void robots_do_cleanup(void);#endif
⌨️ 快捷键说明
复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?