閱讀406 返回首頁    go 技術社區[雲棲]


使用正則表達式和REPLACE,SPLIT獲得7,8,9天單個城市天氣情況抓取解析代碼

代碼寫的很淩亂,正則用得也不是很好,不過還是實現了功能,貼出代碼


package com.zzk.cn;

import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.net.MalformedURLException;
import java.net.URL;
import java.net.URLConnection;
import java.util.regex.Matcher;
import java.util.regex.Pattern;


public class TestSpider {

	public static void main(String[] args) {
		URL url = null;
		URLConnection conn = null;
		InputStream in = null;
		InputStreamReader isr = null;
		BufferedReader br = null;
		try {
			url = new URL("https://www.haotq.com/d_anqing.html");
			conn = url.openConnection();
			in = conn.getInputStream();
			isr = new InputStreamReader(in);
			br = new BufferedReader(isr);
			String line = "";
			String info="";
			while (null != (line = br.readLine())) {
				//System.out.println(line);
				info+=line;
			}
		
			//System.out.println(info);
			Pattern p=Pattern.compile("div\\sid=.weather_day_brief.*?</div>");//正則獲取網頁大致信息

			Matcher m=p.matcher(info);
			String s1="";
	    	while(m.find()) {
	    		s1=m.group();
	    		//System.out.println(s1);
	    	}
	    	
	    	String s2="";
	        Pattern p1=Pattern.compile("<br>.*<script");//正則根據br獲取7,8,9天的天氣信息
	    	//Pattern p1=Pattern.compile("<(/?\\s?br\\b)>");
	    	Matcher m1=p1.matcher(s1);
	    	while(m1.find()) {
	    		//System.out.println(m1.group());
	    	    s2=m1.group();
	    	}
			
	    	String[] sPlit=s2.split("<br>"); 

	    	int i=s2.length(); 
	    		String t1="";
	    		String t2="";
	    		String t3="";
	    		t1=sPlit[7];
	    		t2=sPlit[8];
	    		t3=sPlit[9];
	    		System.out.println(t1);//7天後天氣
	    		System.out.println(t2);//8天後天氣
	    		System.out.println(t3);//9天後天氣
	    	
	    	
	    		//天氣
	    	String[] sPlit1=t1.split(" "); 
	    	int i1=t1.length();
	    	System.out.println(sPlit1[1]);//白天陣雨,夜間陣雨,
	    	System.out.println(sPlit1[2]);//氣溫2℃~9℃
	    	System.out.println(sPlit1[3]);//北偏東風 二級
	    	
	    	String w1="";
	    	String w2="";
	    	String w3="";
	    	w1=sPlit1[1];
	    	String[] sPlit4=w1.split(",");
	    	String weather_title71=sPlit4[0].replace("白天", "");//第七天的白天的字段
	    	String weather_title72=sPlit4[1].replace("夜間", "");//第七天的夜晚的字段
            System.out.println(weather_title71);//第七天的白天天氣情況
            System.out.println(weather_title72);//第七天的夜晚天氣情況
	    	
	    	w2=sPlit1[2];
	    	String[] sPlit5=w2.split("~");
	    	String weather_temp71=sPlit5[0].replace("氣溫", "");
	    	String weather_temp72=sPlit5[1].replace("~", "").replace(",", "");
	    	System.out.println(weather_temp71);//第七天的最低氣溫
	    	System.out.println(weather_temp72);//第七天的最高氣溫
	    	
	    	w3=sPlit1[3];
	    	String[] sPlit6=w3.split(" ");
	    	String weather_winddirection71=sPlit6[0];
	    	String weather_windpower71=sPlit6[1];
	    	System.out.println(weather_winddirection71);//第七天的風向
	    	System.out.println(weather_windpower71);//第七天的風力
	    	
	    	String[] sPlit2=t2.split(" "); 
	    	int i2=t2.length();
	    	
	    	String w4="";
	    	String w5="";
	    	String w6="";
	    	w4=sPlit2[1];
	    	String[] sPlit7=w4.split(",");
	    	String weather_title81=sPlit7[0].replace("白天", "");//第八天的白天的字段
	    	String weather_title82=sPlit7[1].replace("夜間", "");//第八天的夜晚的字段
            System.out.println(weather_title81);//第八天的白天天氣情況
            System.out.println(weather_title82);//第八天的夜晚天氣情況
	    	
	    	w5=sPlit2[2];
	    	String[] sPlit8=w5.split("~");
	    	String weather_temp81=sPlit8[0].replace("氣溫", "");
	    	String weather_temp82=sPlit8[1].replace("~", "").replace(",", "");
	    	System.out.println(weather_temp81);//第八天的最低氣溫
	    	System.out.println(weather_temp82);//第八天的最高氣溫
	    	
	    	w6=sPlit2[3];
	    	String[] sPlit9=w6.split(" ");
	    	String weather_winddirection81=sPlit9[0];
	    	String weather_windpower81=sPlit9[1];
	    	System.out.println(weather_winddirection81);//第八天的風向
	    	System.out.println(weather_windpower81);//第八天的風力
	    	
	    	
	    	String[] sPlit3=t3.split(" "); 
	    	int i3=t3.length();
	    	System.out.println(sPlit3[1]);
	    	System.out.println(sPlit3[2]);
	    	System.out.println(sPlit3[3]);
	    	
	    	String w7="";
	    	String w8="";
	    	String w9="";
	    	w7=sPlit3[1];
	    	String[] sPlit10=w7.split(",");
	    	String weather_title91=sPlit10[0].replace("白天", "");//第九天的白天的字段
	    	String weather_title92=sPlit10[1].replace("夜間", "");//第九天的夜晚的字段
            System.out.println(weather_title91);//第九天的白天天氣情況
            System.out.println(weather_title92);//第九天的夜晚天氣情況
	    	
	    	w8=sPlit3[2];
	    	String[] sPlit11=w8.split("~");
	    	String weather_temp91=sPlit11[0].replace("氣溫", "");
	    	String weather_temp92=sPlit11[1].replace("~", "").replace(",", "");
	    	System.out.println(weather_temp91);//第九天的最低氣溫
	    	System.out.println(weather_temp92);//第九天的最高氣溫
	    	
	    	w9=sPlit3[3];
	    	String[] sPlit12=w9.split(" ");
	    	String weather_winddirection91=sPlit12[0];
	    	String weather_windpower91=sPlit12[1].replace("<script", "");
	    	System.out.println(weather_winddirection91);//第九天的風向
	    	System.out.println(weather_windpower91);//第九天的風力
	    			
		} catch (MalformedURLException e) {
			e.printStackTrace();
		} catch (IOException e) {
			e.printStackTrace();
		} finally {
			try {
				if (null != br) {
					br.close();
				}
			} catch (IOException e) {
				e.printStackTrace();
			}
			br = null;

			try {
				if (null != isr) {
					isr.close();
				}
			} catch (IOException e) {
				e.printStackTrace();
			}
			isr = null;

			try {
				if (null != in) {
					in.close();
				}
			} catch (IOException e) {
				e.printStackTrace();
			}
			in = null;
		}

	}
}

輸出:

7天後安慶天氣:&nbsp;白天陣雨,夜間陣雨,&nbsp;氣溫2℃~9℃,&nbsp;北偏東風 二級
8天後安慶天氣:&nbsp;白天陣雨,夜間陣雨,&nbsp;氣溫-1℃~7℃,&nbsp;北偏東風 二級
9天後安慶天氣:&nbsp;白天局部多雲,夜間局部多雲,&nbsp;氣溫-1℃~8℃,&nbsp;北偏東風 二級<script
白天陣雨,夜間陣雨,
氣溫2℃~9℃,
北偏東風 二級
陣雨
陣雨
2℃
9℃
北偏東風
二級
陣雨
陣雨
-1℃
7℃
北偏東風
二級
白天局部多雲,夜間局部多雲,
氣溫-1℃~8℃,
北偏東風 二級<script
局部多雲
局部多雲
-1℃
8℃
北偏東風
二級





















最後更新:2017-04-02 06:52:15

  上一篇:go 如何精確地測量java對象的大小-底層instrument API
  下一篇:go android中Parcel中文亂碼的解決:巧用十六進製