1,两个小时学会perl
http://qntm.org/files/perl/perl.html
2,Python整站爬虫(Demo)(依赖Mysql)
3,JAVA构造器的实际使用
package basic.day12;
/**
 * Minimal user record used to demonstrate a parameterized constructor.
 *
 * <p>All three fields are package-visible and are set once by the
 * constructor; no validation is performed on any of them.
 */
public class User {
    /** User name; appears in {@link #toString()}. */
    String name;
    /** Password; stored as given and never included in {@link #toString()}. */
    String pwd;
    /** Age; appears in {@link #toString()}. */
    int age;

    /**
     * Creates a user with every field supplied by the caller.
     *
     * @param name user name
     * @param pwd  password
     * @param age  age
     */
    public User(String name, String pwd, int age) {
        this.name = name;
        this.pwd = pwd;
        this.age = age;
    }

    /**
     * Returns the user as {@code name:age}; the password is left out.
     *
     * @return the name and age joined by a colon
     */
    @Override
    public String toString() {
        return name + ":" + age;
    }
}
4,Perl爬虫动手(抓首页)
下面的代码目前只实现了抓取首页,后面会改下,要求抓2级到3级页面
#!/usr/bin/perl
use HTML::LinkExtor;
use LWP::Simple;
# sparit($base_url)
#
# Fetch the page at $base_url, collect every link-valued attribute that
# HTML::LinkExtor reports for it (made absolute against $base_url), and
# return the ones whose text starts with $base_url.
#
# Parameters:
#   $base_url - URL of the page to fetch; also used as the literal prefix
#               that decides whether a link belongs to the same site.
#
# Returns:
#   A sorted, de-duplicated list of matching URLs, each with a trailing
#   "\n" appended. The list is empty when the page cannot be fetched.
#
# All state is lexical, so repeated calls do not accumulate results from
# earlier calls.
sub sparit {
    my ($base_url) = @_;

    my @same_site_urls;

    # Fetch the page; LWP::Simple::get returns undef on failure.
    my $html = get($base_url);
    if (!defined $html) {
        warn "sparit: could not fetch $base_url\n";
        return @same_site_urls;
    }

    # Extract links, resolving relative ones against $base_url.
    my $parser = HTML::LinkExtor->new(undef, $base_url);
    $parser->parse($html);
    $parser->eof;

    # Each entry is [ $tag, $attr_name => $attr_value, ... ]; only the
    # attribute values (the URLs) matter here.
    my %seen;
    for my $link ($parser->links) {
        my ($tag, %url_for_attr) = @{$link};
        $seen{$_}++ for values %url_for_attr;
    }

    # Sort and drop URLs that are not under $base_url. \Q...\E makes the
    # URL match literally instead of being read as a regex.
    for my $url (sort keys %seen) {
        next unless $url =~ m{\A\Q$base_url\E};
        push @same_site_urls, "$url\n";
    }

    # Return the matching URLs.
    return @same_site_urls;
}
5,Python字符串处理例子
#!/usr/bin/python
#coding=gb2312
# Short tour of common string operations. Every print uses the
# single-argument call form, which produces the same output on
# Python 2 and Python 3.

# Split a comma-separated record into a list of fields.
line = 'aa,bb,cc,dd'
print(line.split(','))

w = 'start'
s = 'wic\n'
print(w.upper())      # upper-cased copy
print(w.isalpha())    # True: every character is a letter
print(s.rstrip())     # trailing whitespace (the newline) removed

# Two ways to substitute values into a template string.
print('%s,caonima,de,%s' % ('wo', 'b'))
print('{0},caonima,de,{1}'.format('cao', 'nidaye'))