inc_coonepage.php

来自「这是matlab的一个小程序」· PHP 代码 · 共 101 行

PHP
101
字号
<?php
//采集指定页面作为文章发布源
require_once(DEDEINC.'/charset.func.php');
function CoOnePage($gurl)
{
	global $dsql,$cfg_auot_description, $cfg_soft_lang;
	$redatas = array('title' => '','body' => '','source' => '','writer' => '','description' => '','keywords' => '');
	$redatas['source'] = preg_replace("/http:\/\//i","",$gurl);
	$redatas['source'] = preg_replace("/\/(.*)$/i","",$redatas['source']);
	$row = $dsql->GetOne("Select * From `#@__co_onepage` where url like '".$redatas['source']."' ");
	$s = $e = '';
	if(is_array($row))
	{
		list($s,$e) = explode('{@body}',$row['rule']);
		$s = trim($s);
		$e = trim($e);
		if($row['issource']==1)
		{
			$redatas['source'] = $row['title'];
		}
	}
	$htd = new DedeHttpDown();
	$htd->OpenUrl($gurl);
	$body = $htd->GetHtml();
	if($body!='')
	{
		//编码自动转换
		if($cfg_soft_lang=='utf-8')
		{
	 			if($row['lang']=='gb2312')
	 			{
	 				$body = gb2utf8($body);
	 			}
		}
		else if($cfg_soft_lang=='gb2312')
		{
				if($row['lang']=='utf-8')
				{
					$body = utf82gb($body);
				}
		}

		//获取标题
		$inarr = array();
		preg_match("/<title>(.*)<\/title>/isU",$body,$inarr);
		if(isset($inarr[1]))
		{
			$redatas['title'] = $inarr[1];
		}

		//获取关键词
		$inarr = array();
		preg_match("/<meta[\s]+name=['\"]keywords['\"] content=['\"](.*)['\"]/isU",$body,$inarr);
		if(isset($inarr[1]))
		{
			$redatas['keywords'] = cn_substr(html2text($inarr[1]),30);
		}

		//获取摘要
		$inarr = array();
		preg_match("/<meta[\s]+name=['\"]description['\"] content=['\"](.*)['\"]/isU",$body,$inarr);
		if(isset($inarr[1]))
		{
			$redatas['description'] = cn_substr(html2text($inarr[1]),$cfg_auot_description);
		}

		//获取内容
		if($s!='' && $e!='')
		{
			$redatas['body'] = GetHtmlAreaA($s,$e,$body);
			if($redatas['body']!='' && $redatas['description']=='')
			{
				$redatas['description'] = cn_substr(html2text($redatas['body']),$GLOBALS['cfg_auot_description']);
			}
		}
	}
	return $redatas;
}

//获取特定区域的HTML
function GetHtmlAreaA($s,$e,&$html)
{
	if($html==""||$s=="")
	{
		return "";
	}
	$posstart = @strpos($html,$s);
	if($posstart===false)
	{
		return "";
	}
	$posend = strpos($html,$e,$posstart);
	if($posend > $posstart && $posend!==false)
	{
		return substr($html,$posstart+strlen($s),$posend-$posstart-strlen($s));
	}else
	{
		return '';
	}
}
?>

⌨️ 快捷键说明

复制代码Ctrl + C
搜索代码Ctrl + F
全屏模式F11
增大字号Ctrl + =
减小字号Ctrl + -
显示快捷键?