锘??xml version="1.0" encoding="utf-8" standalone="yes"?>久久亚洲精品国产精品婷婷,亚洲婷婷综合色高清在线,国产v亚洲v天堂无码网站http://m.tkk7.com/ibmsoft/ibmsoft 鍔姏涓嶄竴瀹氭垚鍔?鏀懼純涓瀹氬け璐? 鍧氭寔鑷繁鐨勭悊鎯?瀹炵幇鑷繁鐨勭洰鏍? 鏈夊ソ鐨勬兂娉曞氨瑕佸嚭鎯沖姙娉曞疄鐜?zh-cnSun, 06 Jul 2025 06:11:08 GMTSun, 06 Jul 2025 06:11:08 GMT60appfuse 鍐嶅涔狅紒http://m.tkk7.com/ibmsoft/archive/2006/08/11/63038.htmlibmsoftibmsoftFri, 11 Aug 2006 08:44:00 GMThttp://m.tkk7.com/ibmsoft/archive/2006/08/11/63038.htmlhttp://m.tkk7.com/ibmsoft/comments/63038.htmlhttp://m.tkk7.com/ibmsoft/archive/2006/08/11/63038.html#Feedback0http://m.tkk7.com/ibmsoft/comments/commentRss/63038.htmlhttp://m.tkk7.com/ibmsoft/services/trackbacks/63038.html
用最新的appfuse1.9.3版本：<br />
到 http://appfuse.org/ 下载appfuse1.9.3

用idea打开
只需要修改properties.xml中的
    <!-- Defaults for database.properties -->
    <property name="database.jar" location="${mysql.jar}"/>
    <property name="database.type" value="mysql"/>
    <property name="database.name" value="appfuse"/>
    <property name="database.host" value="localhost"/>
    <property name="database.username" value="root"/>
    <property name="database.password" value="root"/>

鎶婂叾涓殑localhost淇敼鎴愬疄闄呯殑ip灝眔k浜?br />姣斿璇存槸錛?92.169.0.1:3306錛屾敞鎰忎竴瀹氳鍔犱笂绔彛鍙鳳紒

鐒跺悗鍦╝nt涓繍琛岀浉鍏崇殑浠誨姟錛?br />鎴戣繖閲岀殑鎯呭喌鏄細
寤烘暟鎹簱琛ㄥ拰鏁版嵁鐨勪笉璧版槸
榪愯 db錛峱repare錛嶏紞銆媎b錛峜reate錛嶏紞銆媎b錛峫oad錛岃繖鏍鋒暟鎹氨寤轟笂浜?br />
鐒跺悗deploy錛屽湪ie涓繍琛宎ppfuse灝眔k浜嗭紒


ibmsoft 2006-08-11 16:44 发表评论
]]>
use google or baidu get the useful urlhttp://m.tkk7.com/ibmsoft/archive/2006/07/25/60029.htmlibmsoftibmsoftTue, 25 Jul 2006 09:26:00 GMThttp://m.tkk7.com/ibmsoft/archive/2006/07/25/60029.htmlhttp://m.tkk7.com/ibmsoft/comments/60029.htmlhttp://m.tkk7.com/ibmsoft/archive/2006/07/25/60029.html#Feedback0http://m.tkk7.com/ibmsoft/comments/commentRss/60029.htmlhttp://m.tkk7.com/ibmsoft/services/trackbacks/60029.html 聽1/*
聽2聽*聽Copyright聽(c)聽2006聽Your聽Corporation.聽All聽Rights聽Reserved.
聽3*/
聽4package聽liuxuan;
聽5
聽6/**
聽7聽*聽Created聽by聽IntelliJ聽IDEA.
聽8聽*聽User:聽Administrator
聽9聽*聽Date:聽2006-7-26
10聽*聽Time:聽15:33:49
11聽*聽To聽change聽this聽template聽use聽File聽|聽Settings聽|聽File聽Templates.
12*/
13import聽org.htmlparser.Node;
14import聽org.htmlparser.Parser;
15import聽org.htmlparser.http.ConnectionManager;
16import聽org.htmlparser.tags.LinkTag;
17import聽org.htmlparser.util.ParserException;
18import聽org.htmlparser.visitors.ObjectFindingVisitor;
19
20import聽java.sql.Statement;
21import聽java.sql.DriverManager;
22import聽java.sql.Connection;
23import聽java.sql.SQLException;
24
25publicclass聽LinkDemo
26{
27聽聽聽聽publicstaticvoid聽main聽(String[]聽args)聽throws聽ParserException,聽SQLException
28聽聽聽聽{
29聽聽聽聽聽聽聽聽ConnectionManager聽cn聽=new聽ConnectionManager();
30聽聽聽聽聽聽聽聽cn.setProxyHost("10.75.1.38");
31聽聽聽聽聽聽聽聽cn.setProxyPort(80);
32聽聽聽聽聽聽聽聽Parser.setConnectionManager(cn);
33聽聽聽聽聽聽聽聽Parser聽parser;
34聽聽聽聽聽聽聽聽//parser.s
35聽聽聽聽聽聽聽聽String[]聽pyurl聽=new聽String[2]聽;
36
37聽聽聽聽聽聽聽聽pyurl[0]="http://www.google.cn/search?num=100&hl=zh-CN&newwindow=1&q=%E6%BF%AE%E9%98%B3&btnG=%E6%90%9C%E7%B4%A2&meta=cr%3DcountryCN";
38聽聽聽聽聽聽聽聽pyurl[1]="http://www.google.cn/search?q=%E6%BF%AE%E9%98%B3&num=100&hl=zh-CN&lr=&cr=countryCN&newwindow=1&start=100&sa=N";
39聽聽聽聽聽聽聽聽for聽(int聽j=0;j<pyurl.length;j++)聽{
40聽聽聽聽聽聽聽聽聽聽聽聽parser聽=new聽Parser聽(pyurl[j]);
41聽聽聽聽聽聽聽聽聽聽聽聽ObjectFindingVisitor聽visitor聽=new聽ObjectFindingVisitor聽(LinkTag.class);
42聽聽聽聽聽聽聽聽聽聽聽聽parser.visitAllNodesWith聽(visitor);
43聽聽聽聽聽聽聽聽聽聽聽聽Node[]聽links聽=聽visitor.getTags聽();
44聽聽聽聽聽聽聽聽聽聽聽聽String聽sql;
45聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽try聽{
46聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽Class.forName("com.mysql.jdbc.Driver");
47聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽}聽catch聽(ClassNotFoundException聽e)聽{
48聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽e.printStackTrace();聽聽//To聽change聽body聽of聽catch聽statement聽use聽File聽|聽Settings聽|聽File聽Templates.
49聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽}
50聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽Connection聽conn聽=null;
51聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽try聽{
52聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽conn聽=聽DriverManager.getConnection("jdbc:mysql://localhost:3306/crawdb",聽"root",聽"root");
53聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽}聽catch聽(SQLException聽e)聽{
54聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽e.printStackTrace();聽聽//To聽change聽body聽of聽catch聽statement聽use聽File聽|聽Settings聽|聽File聽Templates.
55聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽}
56聽聽聽聽聽聽聽聽聽聽聽聽聽Statement聽stmt聽=聽conn.createStatement();
57聽聽聽聽聽聽聽聽聽聽聽聽for聽(int聽i聽=0;聽i聽<聽links.length;聽i++)
58聽聽聽聽聽聽聽聽聽聽聽聽{
59聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽sql="";
60聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽LinkTag聽linkTag聽=聽(LinkTag)links[i];
61聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽if聽(linkTag.getLink().indexOf("cache")<0&&聽聽linkTag.getLink().indexOf("google")<0&&linkTag.getLinkText().indexOf("嬋槼")>0)聽聽{
62
63
64聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽sql="insert聽into聽urls(name,note,url)聽values('"+linkTag.getLinkText聽()+"','"+"lixuan"+"','"+linkTag.getLink聽()+"')";
65聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽stmt.executeUpdate(sql);
66聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽//rs.close();
67
68聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽System.out.print聽("\""聽+聽linkTag.getLinkText聽()聽+聽"\"聽=>聽");
69聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽System.out.println聽(linkTag.getLink聽());
70聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽}
71聽聽聽聽聽聽聽聽聽聽聽聽}
72聽聽聽聽聽聽聽聽聽聽聽聽聽stmt.close();
73聽聽聽聽聽聽聽聽聽聽聽聽聽conn.close();
74聽聽聽聽聽聽聽聽}
75聽聽聽聽}
76
77}
78


ibmsoft 2006-07-25 17:26 发表评论
]]>
Nutch Cache Page picture problemhttp://m.tkk7.com/ibmsoft/archive/2006/06/28/55609.htmlibmsoftibmsoftWed, 28 Jun 2006 13:03:00 GMThttp://m.tkk7.com/ibmsoft/archive/2006/06/28/55609.htmlhttp://m.tkk7.com/ibmsoft/comments/55609.htmlhttp://m.tkk7.com/ibmsoft/archive/2006/06/28/55609.html#Feedback0http://m.tkk7.com/ibmsoft/comments/commentRss/55609.htmlhttp://m.tkk7.com/ibmsoft/services/trackbacks/55609.html
  • I use Nutch to crawl the intranet, but the cached page (cache.jsp) has many problems: images show up as broken (X) because I filter out gif|jpg and so on.
    So I use ORO to replace the image paths in the HTML content with my custom picture.
    Code:
    聽1聽聽聽聽String聽sRegexpSrc="src\\s*=\\s*\"([\\.]*)/([a-z]*)/([^\"]+)";
    聽2聽聽聽聽String聽sRegxpBackground聽="background\\s*=\\s*\"([.]*)/([a-z]*)/([^\"]+)";
    聽3聽聽聽聽String聽sAdd聽="";
    聽4聽聽聽聽String聽sNewContent="";
    聽5聽聽聽聽PatternCompiler聽compiler聽=new聽Perl5Compiler();
    聽6聽聽聽聽Pattern聽pattern聽=null,pattern1聽=null聽;
    聽7聽聽聽聽try{
    聽8聽聽聽聽聽聽聽聽pattern聽=聽compiler.compile(sRegexpSrc,Perl5Compiler.CASE_INSENSITIVE_MASK);
    聽9聽聽聽聽聽聽聽聽pattern1聽=聽compiler.compile(sRegxpBackground,Perl5Compiler.CASE_INSENSITIVE_MASK);
    10聽聽聽聽}
    catch聽(MalformedPatternException聽e){
    11聽聽聽聽聽聽聽聽
    12聽聽聽聽聽聽聽聽e.printStackTrace();
    13聽聽聽聽}

    14聽聽聽聽PatternMatcher聽matcher聽=new聽Perl5Matcher();
    15
    16if聽(matcher.contains(content,聽pattern)){
    17聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽MatchResult聽result聽=聽matcher.getMatch();
    18聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽//System.out.println(result.toString());
    19聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽sAdd聽=聽result.group(1)+"/"+result.group(2)+"/"+result.group(3);
    20聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽//System.out.println("sAdd=聽"+sAdd);
    21聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽sNewContent=content.replaceAll(sAdd,"\\img\\liuxuan");
    22聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽聽//System.out.println("FinalString="+sTest.replaceAll(sAdd,"/img/liuxuan.png"));
    23聽聽聽聽聽聽聽聽聽聽聽聽//System.out.print("sTest=聽"+result.group(1)+"/"+result.group(2));
    24聽聽聽聽聽聽聽聽}
    else{
    25聽聽聽聽聽聽聽聽聽聽聽聽//System.out.print("Can't聽find聽the聽String聽");
    26
    27聽聽聽聽聽聽聽聽}



  • ibmsoft 2006-06-28 21:03 发表评论
    ]]>
    Java瀹炵幇鍒╃敤鎼滅儲寮曟搸鏀墮泦緗戝潃鐨勭▼搴?/title><link>http://m.tkk7.com/ibmsoft/archive/2006/06/14/52834.html</link><dc:creator>ibmsoft</dc:creator><author>ibmsoft</author><pubDate>Wed, 14 Jun 2006 11:50:00 GMT</pubDate><guid>http://m.tkk7.com/ibmsoft/archive/2006/06/14/52834.html</guid><wfw:comment>http://m.tkk7.com/ibmsoft/comments/52834.html</wfw:comment><comments>http://m.tkk7.com/ibmsoft/archive/2006/06/14/52834.html#Feedback</comments><slash:comments>1</slash:comments><wfw:commentRss>http://m.tkk7.com/ibmsoft/comments/commentRss/52834.html</wfw:commentRss><trackback:ping>http://m.tkk7.com/ibmsoft/services/trackbacks/52834.html</trackback:ping><description><![CDATA[ <table class="blueBox" border="0"> <tbody> <tr> <td width="558"> <div id="m80seyq" class="mainbody"> <div id="ee88ic0" class="blogpost partsmb" id="rtebox" style="PADDING-RIGHT: 0px; PADDING-LEFT: 0px; PADDING-BOTTOM: 0px; MARGIN: 0px; PADDING-TOP: 0px"> <div id="umoyww8" class="MSN_EDITCONTAINER">聽</div> </div> </div> </td> </tr> <tr> <td style="BORDER-RIGHT: rgb(232,232,232) 1px solid; BORDER-LEFT: rgb(232,232,232) 1px solid" align="middle" bgcolor="#f9f9f9" colspan="3"> <table cellspacing="0" cellpadding="0" width="700" align="center" border="0"> <tbody> <tr bgcolor="#f9f9f9"> <td style="LINE-HEIGHT: 200%"> <p>鎴戣繖閲岃鐨勪笉鏄庝箞浣跨敤鎼滅儲寮曟搸錛岃屾槸鎬庝箞璁╃▼搴忓埄鐢ㄦ悳绱㈠紩鎿庢潵鎼滈泦緗戝潃錛岃繖鏈変粈涔堢敤錛熷緢鏈夌敤錛佺綉涓婂姩杈勬湁浜哄彨鍗栫綉鍧鏁版嵁搴擄紝濡傚彂甯冭蔣浠剁綉鍧銆侀偖浠跺湴鍧銆佽鍧涚綉鍧銆佽涓氱綉鍧錛岃繖浜涚綉鍧鏄庝箞鏉ョ殑鍛紵涓嶅彲鑳芥槸浜烘墜宸ユ敹闆嗚屾潵鐨勶紝閮芥槸璁╃▼搴忓埄鐢ㄦ悳绱㈠紩鎿庡彇鍒扮殑錛屽鏋滄偍闇瑕佹煇綾葷綉鍧淇℃伅鏁版嵁錛屽氨璺熸垜鏉ヤ竴璧風爺絀朵竴涓嬶紝闈炲父綆鍗曘?/p> <p>銆銆鏈枃閲囩敤Java璇█鍐欐垚錛屼互google鍜岀櫨搴︽悳绱㈠紩鎿庝負瀵硅薄銆?/p> <p>銆銆鎴戜滑瑕佸埄鐢╣oogle銆佺櫨搴︽悳绱㈠紩鎿庣殑鎼滅儲瑙勫垯涓殑涓ゆ潯錛屽叧閿瓧鎼滅儲鍜宨nurl鎼滅儲銆備粈涔堟槸inurl鎼滅儲錛屽氨鏄綘鎵瑕佹悳绱㈢殑緗戝潃涓湰韜甫鏈夌殑鍏抽敭瀛楋紝姣斿http://www.xxx.com/post.asp ,榪欎釜緗戝潃灝卞惈鏈塸ost.asp榪欐牱鐨勫叧閿瓧錛屽湪鎼滅儲寮曟搸涓~鍐欒鍒欐槸 inurl:post.asp,榪欐槸鏀墮泦緗戝潃鐨勫叧閿紝鍥犱負寰堝緗戝潃鏈韓浼氬甫鏈夌壒瀹氱殑淇℃伅錛屾瘮濡傝蔣浠跺彂甯冪殑緗戦〉緗戝潃淇℃伅涓鍚湁 
publish銆乻ubmit銆乼uijian榪欐牱鐨勪俊鎭紝濡俬ttp://www.xxx.com/publish.asp,榪欐牱鐨勭綉鍧澶氭槸鍙戝竷淇℃伅鐨勭綉欏碉紝鍦ㄧ粨鍚堢綉欏典腑鏈韓鍙兘鍚湁鐨勫叧閿瓧錛屽氨鍙互鐢ㄦ悳绱㈠紩鎿庢悳绱㈠嚭緇撴灉錛岀劧鍚庢垜浠埄鐢ㄧ▼搴忓皢緇撴灉鍙栧洖錛屽HTML欏甸潰榪涜鍒嗘瀽錛屽幓闄ゆ病鏈夌敤鐨勪俊鎭紝灝嗘湁鐢ㄧ殑緗戝潃淇℃伅鍐欏叆鏂囦歡鎴栬呮暟鎹簱錛屽氨鍙互緇欏叾瀹冨簲鐢ㄧ▼搴忔垨鑰呬漢鏉ヤ嬌鐢ㄤ簡銆?/p> <p>銆銆絎竴姝ワ紝鐢ㄧ▼搴忓皢鎼滅儲緇撴灉鍙栧洖錛屽厛浠ョ櫨搴︿負渚嬶紝姣斿鎴戜滑瑕佹悳绱㈣蔣浠跺彂甯冪殑緗戦〉錛屽叧閿瓧閲囩敤 鈥滆蔣浠跺彂甯?鐗堟湰 inurl:publish.asp",鍏堢櫥褰曠櫨搴︾湅鐪嬶紝灝嗗叧閿瓧鍐欏叆錛岀劧鍚庢彁浜わ紝鍦ㄥ湴鍧鏍忓氨浼氱湅鍒?http://www.baidu.com/s?ie=gb2312&bs=%C8%ED%BC%FE%B7%A2%B2%BC+%C8%ED%BC%FE%B0%E6%B1%BE+inurl%3Apublish.asp&sr=&z=&cl=3&f=8&wd=%C8%ED%BC%FE%B7%A2%B2%BC+%B0%E6%B1%BE+inurl%3Apublish.asp&ct=0 ,涓枃鍏抽敭瀛楀叏閮藉彉鎴愮紪鐮佷簡錛屾病鏈夊叧緋伙紝鎴戜滑鍦ㄧ▼搴忎腑鐩存帴鐢ㄤ腑鏂囦篃鏄彲浠ョ殑錛屽叾涓涓叧閿瓧鐢紜鍙風浉榪烇紝鍘繪帀涓浜涙病鏈夌敤鐨勪俊鎭紝鎴戜滑鍙互鎶婂湴鍧浼樺寲鎴?http://www.baidu.com/s?lm=0&si=&rn=20&ie=gb2312&ct=0& wd=杞歡鍙戝竷+鐗堟湰+inurl%3Apublish%2Easp&pn=0&cl=0錛屽叾涓璻n琛ㄧず涓欏墊樉紺哄灝戜釜緇撴灉錛寃d=琛ㄧず浣犺鎼滅儲鐨勫叧閿瓧錛宲n琛ㄧず浠庣鍑犳潯寮濮嬫樉紺猴紝榪欎釜pn灝嗘槸鎴戜滑紼嬪簭寰幆鍙栫粨鏋滅殑鍙橀噺錛屾瘡20鏉″驚鐜竴嬈°傛垜浠敤Java鍐欑殑紼嬪簭鏉ユā鎷熻繖涓悳绱㈢殑榪囩▼錛岀敤鍒扮殑鍏抽敭綾諱負 java.net.HttpURLConnection,java.net.URL錛屽厛鍐欎竴涓彁浜ゆ悳绱㈢殑class,鍏抽敭浠g爜濡備笅錛?/p> <p>class Search<br />{<br />銆public URL url;<br />銆public HttpURLConnection http;<br />銆public java.io.InputStream urlstream;<br />銆......<br />銆for(int i=0;i++;i <100)<br />銆{<br />銆銆......<br />銆銆try {<br />銆銆銆url = new URL("www.baidu.com/s?lm=0&si=&rn=20&ie=gb2312&ct=0& wd=杞歡鍙戝竷+鐗堟湰+inurl%3Apublish%2Easp&pn="+beginrecord+"&cl=0");<br />銆銆}catch(Exception ef){};<br />銆銆try {<br />銆銆銆http = (HttpURLConnection) url.openConnection();<br />銆銆銆http.connect();<br />銆銆銆urlstream = http.getInputStream();<br />銆銆}catch(Exception ef){};<br />銆銆java.io.BufferedReader l_reader = new java.io.<br />銆銆BufferedReader(new java.io.InputStreamReader(urlstream));<br />銆銆try {<br />銆銆銆while ((currentLine = l_reader.readLine()) != null) {<br />銆銆銆銆totalstring += currentLine;<br />銆銆銆}<br />銆銆} catch (IOException ex3) {}<br />銆銆....<br />銆銆//鏈鎼滅儲鐨勭粨鏋滃凡緇忔斁鍒皌otalstring涓簡錛屾槸涓浜汬TML浠g爜錛岄渶瑕佷笅涓姝ヨ繘琛屽垎鏋愪簡銆?br />}<br />銆銆鍐嶄互google涓轟緥錛岀◢寰湁浜涗笉鍚岋紝google瀵規祻瑙堝櫒榪涜浜嗕竴浜涙嫻嬶紝緙栫爜涔熶笉鍚岋紝URL涓篽ttp: 
//www.google.com/search?q=杞歡鍙戝竷+鐗堟湰+inurl:publish.asp&hl=zh-CN&lr= &newwindow=1&start=0&sa=N&ie=UTF-8,鍏朵腑緙栫爜瑕佺敤ie=UTF-8,start琛ㄧず浠庣鍑犳潯璁板綍鏄劇ず錛岄渶瑕佹敞鎰忕殑鏄痝oogle瀵規祻瑙堝櫒榪樿媯鏌ワ紝濡傛灉嫻忚鍣ㄤ笉絎﹀悎瀹冪殑瑕佹眰錛屽皢榪斿洖閿欒浠g爜錛屾墍浠ュ湪妯℃嫙嫻忚鍣ㄦ彁浜や腑錛屾垜浠澶氬姞涓琛屼唬鐮侊紝淇敼鍏抽敭閮ㄥ垎瑕佸皢http灞炴т腑鐨刄ser-Agent璁劇疆涓哄父鐢ㄧ殑嫻忚鍣紝姣斿Mozilla/4.0,浠g爜濡備笅錛?/p> <p>try {<br />銆http = (HttpURLConnection) url.openConnection();<br />銆http.setRequestProperty("User-Agent", "Mozilla/4.0");<br />銆http.connect();<br />銆urlstream = http.getInputStream();<br />}catch(Exception ef){};</p> <p>銆銆絎簩姝ワ紝瀵瑰彇鍥炵殑HTML緙栫爜榪涜鍒嗘瀽錛屽彇鍑哄叾涓殑鏈夌敤緗戝潃淇℃伅錛屽茍鍐欏叆鏂囦歡鎴栬呮暟鎹簱錛岀敱浜庤繖浜涙悳绱㈠紩鎿庨兘鏈夌綉欏靛揩鐓у拰鐩鎬技緗戦〉絳夌綉鍧淇℃伅娣鋒潅鍦℉TML涓紝鎴戜滑瑕佸皢榪欎簺緗戝潃淇℃伅鍓旈櫎鎺夛紝鍓旈櫎鐨勫叧閿氨鏄壘鍑哄叾涓殑瑙勫緥錛岀櫨搴︽悳绱㈠紩鎿庝腑鐨勭綉欏靛揩鐓у拰鍏跺畠娌℃湁鐢ㄧ殑鐨勫湴鍧閮藉惈鏈塨aidu榪欎釜鍏抽敭瀛楋紝鑰実oogle涓惈鏈夌殑鏃犵敤緗戝潃淇℃伅鍚湁鍏抽敭瀛?google鍜宑ache,鎴戜滑灝辨牴鎹繖浜涘叧閿瓧鍓旈櫎鏃犵敤緗戝潃淇℃伅銆傚湪Java涓瀵瑰瓧絎︿覆榪涜鍒嗘瀽蹇呯劧瑕佺敤鍒?java.util.StringTokenize榪欎釜綾伙紝鐢ㄦ潵灝嗗瓧絎︿覆浠ョ壒瀹氱殑鍒嗛殧絎﹀垎寮錛宩ava.util.regex.Pattern鍜?java.util.regex.Matcher鐢ㄦ潵鍖歸厤瀛楃涓詫紝鍏抽敭浠g爜濡備笅錛?/p> <p>class CompareStr<br />{<br />銆public boolean comparestring(String oristring,String tostring)<br />銆{<br />銆銆Pattern p=null; //姝e垯琛ㄨ揪寮?br />銆銆Matcher m=null; //鎿嶄綔鐨勫瓧絎︿覆<br />銆銆boolean b;<br />銆銆p = Pattern.compile(oristring,Pattern.CASE_INSENSITIVE);<br />銆銆m = p.matcher(tostring);<br />銆銆b = m.find();<br />銆銆return b;<br />銆}<br />}</p> <p>class AnalyUrl<br />{<br />銆......<br />銆StringTokenizer token = new StringTokenizer(totalstring," <> \"");<br />銆String firstword;<br />銆CompareStrcompstr = new CompareStr();<br />銆String dsturl = null;<br />銆while (token.hasMoreTokens())<br />銆{<br />銆銆firstword = token.nextToken();<br />銆銆if (!compstr.comparestring("google.com", firstword) && !compstr.comparestring("cache",firstword))<br />銆銆{<br />銆銆銆if (firstword.length() > 7)<br />銆銆銆{<br />銆銆銆銆dsturl = firstword.substring(6,firstword.length() - 1);<br />銆銆銆銆WriteUrl(dsturl); //鎴愬姛鍙栧埌URL錛岃褰曞埌鏂囦歡涓?br />銆銆銆}<br />銆銆}<br />銆}<br />}<br 
/>銆銆閫氳繃浠ヤ笂紼嬪簭錛屾垜浠氨鍙互鏀墮泦鍒拌嚜宸辮鐨勭綉鍧淇℃伅浜嗭紝榪樺彲浠ュ啀鍐欏彟澶栦竴涓簲鐢ㄧ▼搴忥紝瀵規敹闆嗗埌鐨勭綉鍧淇℃伅榪涗竴姝ュ垎鏋愶紝鍙栧嚭鑷繁闇瑕佺殑淇℃伅錛岃繖閲屽氨涓嶅啀绱禈錛岄亾鐞嗛兘鏄竴鏍風殑銆傛渶鍚庨渶璇存槑涓鐐癸紝google鎼滅儲寮曟搸鎼滅儲鎵鑳借繑鍥炵殑緇撴灉涓嶈兘瓚呰繃1000鏉★紝榪囦簡1000鏉★紝灝辯洿鎺ユ彁紺衡滃涓嶈搗錛?Google 涓烘墍鏈夋煡璇㈢殑緇撴灉鏁伴兘涓嶄細瓚呰繃 1000 涓傗濓紝鐧懼害鎼滅儲寮曟搸榪斿洖鐨勭粨鏋滀笉鑳借秴榪?00澶氭潯錛屾墍浠ユ垜浠鎼滅儲鏃跺敖鍙兘澶氬姞鍏抽敭瀛楋紝灝嗙粨鏋滆寖鍥寸緝灝忋?/p> </td> </tr> </tbody> </table> </td> </tr> <tr> <td width="10" height="11"> <img height="11" src="http://www.javafan.net/article/images/u_16.gif" width="10" /> </td> <td style="BORDER-BOTTOM: rgb(232,232,232) 1px solid" width="695" bgcolor="#f9f9f9" height="11"> <img height="1" src="http://www.javafan.net/article/20051223151611967.html" width="1" /> </td> </tr> <div> </div> <div> </div> <div> </div> <div> </div> <div> <div id="o0ouyeo" class="MSN_EDITCONTAINER"> <div id="asiswmk" class="MSN_EDITBOX" contenteditable="true" style="OVERFLOW: auto; WIDTH: 422px; HEIGHT: 44px"> <div>come from </div> <div> <a > <font color="#095801">http://www.javafan.net/article/20051223151611967.html</font> </a> </div> <div> <font color="#095801"> </font>聽</div> <div> <font color="#095801"> </font> </div> </div> </div> </div> </tbody> </table> <img src ="http://m.tkk7.com/ibmsoft/aggbug/52834.html" width = "1" height = "1" /><br><br><div align=right><a style="text-decoration:none;" href="http://m.tkk7.com/ibmsoft/" target="_blank">ibmsoft</a> 2006-06-14 19:50 <a href="http://m.tkk7.com/ibmsoft/archive/2006/06/14/52834.html#Feedback" target="_blank" style="text-decoration:none;">鍙戣〃璇勮</a></div>]]></description></item></channel></rss> <footer> <div class="friendship-link"> <p>感谢您访问我们的网站,您可能还对以下资源感兴趣:</p> <a href="http://m.tkk7.com/" title="亚洲av成人片在线观看">亚洲av成人片在线观看</a> <div class="friend-links"> </div> </div> </footer> 主站蜘蛛池模板: <a href="http://wwwzs88.com" target="_blank">亚洲乱码一二三四五六区</a>| <a href="http://kj555888.com" target="_blank">亚洲日产无码中文字幕</a>| <a href="http://apguangyu.com" target="_blank">亚洲乱码一二三四区麻豆</a>| <a href="http://1992zyzp.com" target="_blank">最近免费mv在线电影</a>| <a 
href="http://av-fantasy.com" target="_blank">亚洲国产综合专区在线电影</a>| <a href="http://86trader.com" target="_blank">免费久久人人爽人人爽av</a>| <a href="http://usagaa.com" target="_blank">国产亚洲福利精品一区</a>| <a href="http://22youjizz.com" target="_blank">久久免费国产精品一区二区</a>| <a href="http://cao8080.com" target="_blank">久久噜噜噜久久亚洲va久</a>| <a href="http://4438xx21.com" target="_blank">日韩精品人妻系列无码专区免费 </a>| <a href="http://dagongxing.com" target="_blank">一二三四免费观看在线电影</a>| <a href="http://0101av.com" target="_blank">亚洲中字慕日产2021</a>| <a href="http://jyzs888.com" target="_blank">国产AV日韩A∨亚洲AV电影</a>| <a href="http://8mav938.com" target="_blank">日韩视频免费在线</a>| <a href="http://zzz134.com" target="_blank">一级特黄aaa大片免费看</a>| <a href="http://kingleadsw.com" target="_blank">在线观看亚洲天天一三视</a>| <a href="http://www-yhty.com" target="_blank">久久免费区一区二区三波多野</a>| <a href="http://bisi666.com" target="_blank">亚洲视频中文字幕在线</a>| <a href="http://8aa3.com" target="_blank">在线精品免费视频无码的</a>| <a href="http://pite2.com" target="_blank">污网站免费在线观看</a>| <a href="http://qiseka.com" target="_blank">久久精品国产亚洲麻豆</a>| <a href="http://aplus178.com" target="_blank">亚洲人成在线免费观看</a>| <a href="http://chch12.com" target="_blank">亚洲精品国产高清在线观看</a>| <a href="http://33303339.com" target="_blank">亚洲国产高清在线一区二区三区</a>| <a href="http://17soco.com" target="_blank">亚洲第一中文字幕</a>| <a href="http://a666999.com" target="_blank">国产大片线上免费观看</a>| <a href="http://zkqzdq.com" target="_blank">日本系列1页亚洲系列</a>| <a href="http://gwcyy.com" target="_blank">亚洲精品无码久久久影院相关影片</a>| <a href="http://cuitccol.com" target="_blank">人妻无码一区二区三区免费 </a>| <a href="http://591se591se.com" target="_blank">无码少妇精品一区二区免费动态 </a>| <a href="http://gedebai.com" target="_blank">一级毛片一级毛片免费毛片</a>| <a href="http://ydysmedia.com" target="_blank">亚洲一区二区三区高清</a>| <a href="http://doubaye.com" target="_blank">四虎www成人影院免费观看</a>| <a href="http://726kxw.com" target="_blank">一级毛片免费播放男男</a>| <a href="http://www026qqcom.com" target="_blank">久久久久亚洲AV无码网站</a>| <a href="http://jinlaifubuxiugang.com" 
target="_blank">成年女人午夜毛片免费看</a>| <a href="http://8x8xbu.com" target="_blank">国产高清视频免费在线观看</a>| <a href="http://fenglengqi.com" target="_blank">亚洲第一网站免费视频</a>| <a href="http://gift1town.com" target="_blank">亚洲av无码乱码在线观看野外 </a>| <a href="http://imfever.com" target="_blank">永久在线观看免费视频</a>| <a href="http://z88d.com" target="_blank">亚洲va久久久久</a>| <script> (function(){ var bp = document.createElement('script'); var curProtocol = window.location.protocol.split(':')[0]; if (curProtocol === 'https') { bp.src = 'https://zz.bdstatic.com/linksubmit/push.js'; } else { bp.src = 'http://push.zhanzhang.baidu.com/push.js'; } var s = document.getElementsByTagName("script")[0]; s.parentNode.insertBefore(bp, s); })(); </script> </body>