根據 //a[@target="_blank"] 查詢 target 屬性為 _blank 的 a 標籤的值
阿新 • • 發佈:2018-12-20
[[email protected] sbin]# cat s1.pl
# s1.pl - print the text content of every <a> element in fh2.html whose
# "target" attribute is exactly "_blank".
use strict;
use warnings;

use LWP::UserAgent;
use DBI;
use POSIX;
use Data::Dumper;
use HTML::TreeBuilder;
use HTML::TreeBuilder::XPath;

# Input document, resolved relative to the current working directory.
my $html_file = 'fh2.html';

my $tree = HTML::TreeBuilder::XPath->new;

# parse_file returns undef when the file cannot be opened; stop here instead
# of silently printing nothing for a missing or unreadable input file.
defined $tree->parse_file($html_file)
    or die "Cannot parse $html_file: $!\n";

# The predicate is an exact string comparison, so anchors with
# target="_blank1" or target="ff" are not selected.
my @title = $tree->findvalues('//a[@target="_blank"]');

# The values are written back to back, with no separator and no trailing
# newline.
print @title;

# Release the parsed tree explicitly once it is no longer needed.
$tree->delete;
[[email protected] sbin]#
[[email protected] sbin]#
[[email protected] sbin]# cat fh2.html
<div class="daohang-kuai">
<div class="daohang-org"><span>合規部</span></div>
<div class="daohang-links"><a href="http://10.3.246.2:7001/newaml?tgt=TGT-518341-bAJd4aeK0sZnlJQC3ET2U2VPUCSDmNlMm3dq0VITiIrOQUx6ik-cas01.example.org" target="_blank">反洗錢系統</a> <span >|</span><a href="/tailong/syslink/goAml.jsp?tgt=TGT-518341-bAJd4aeK0sZnlJQC3ET2U2VPUCSDmNlMm3dq0VITiIrOQUx6ik-cas01.example.org" target="_blank">新一代反洗錢工作平臺</a> <span >|</span><div class="clear"></div></div><div class="daohang-links"><a href="/tailong/syslink/oaforward.jsp?idName=crmis&tgt=TGT-518341-bAJd4aeK0sZnlJQC3ET2U2VPUCSDmNlMm3dq0VITiIrOQUx6ik-cas01.example.org" target="_blank">合規和操作風險管理系統</a> <span >|</span><a href="http://10.3.200.16:7001/UtanWeb/index.jsp?tgt=TGT-518341-bAJd4aeK0sZnlJQC3ET2U2VPUCSDmNlMm3dq0VITiIrOQUx6ik-cas01.example.org" target="_blank">黑名單監控管理系統</a> <span >|</span><div class="clear"></div></div>
</div>
</div>
</div>
</div>
<a target='ff'>8888999gdsgdhg</a>
<a target='_blank'>732332</a>
<a target='_blank1'>寺昌</a>
You have mail in /var/spool/mail/root
[[email protected] sbin]# vim fh2.html
[[email protected] sbin]# perl s1.pl
反洗錢系統新一代反洗錢工作平臺合規和操作風險管理系統黑名單監控管理系統732332[[email protected] sbin]#