[转载]获取网络MP3真实地址-Mikel

[转载]获取网络MP3真实地址 – Java综合 – Java – JavaEye论坛.

MP3网站的歌曲链接都采用了不同的加密方法，直接从页面的源文件中是找不到其MP3的网址的。以下有两个public class都可独立运行，只要将其构造方法更名为main方法就可以了，同时还需要在给出的JAVA源代码中找到“//播放或下载代码…”这一行，将其改为“Thread.sleep(200)”延时，否则同一IP频繁的连接请求会遭服务器拒绝或引发服务器的防恶意搜索保护。

1.获取百度新歌MP3真实地址

百度新歌的网址是http://xinge.baidu.com/index.html，打开该页面后用查看源文件，搜索“{sid:”，会看到这样的文本：

http://xinge.baidu.com/index.html的源文件片断

{sid:'468aecfeaabbd9467fb939a2e80da58a.mp3',al:'今生无缘',ti:'一天爱一点',si:'易欣孙莺',cp:'华友金信子 ',da:'2010-08-03',cv:'38d9e957d5bdfb788989f1eb12239d8f.jpg',lrc:'b118977f14893a70ab4652031dd1633d.txt',dl:'511',tl:'281394',ico:0}

其中：“sid:”后面是歌曲连接、“al:”后是唱片集、“ti:”后面是歌曲标题、“si:”后面是歌手。

读取“sid:”后面用一对单引号括起来的字符串，在前面加上 http://xinge.baidu.com/wgns/url/ 构成歌曲的链接，例如：http://xinge.baidu.com/wgns/url/468aecfeaabbd9467fb939a2e80da58a.mp3，这个链接是用于打开试听窗口的。
试听窗口查看不到源文件，那就编程打开这个歌曲链接的网址并解析其源文件。接收到的源文件只有一行，在这一行字符串前面加上http://xinge.baidu.com就是MP3的真实网址了，这个网址可用于播放或下载MP3。

源代码如下：

Java代码

/*
* XingeBaidu.java – 获取’百度新歌’的MP3真实网址
*/
package jmp123.player;
import java.io.BufferedReader;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.net.URL;
import java.net.HttpURLConnection;
/**
 * Prints the real MP3 address of the songs listed on the Baidu "new songs" page.
 *
 * <p>All work happens in the constructor: it downloads the index page, looks for
 * lines containing a song record (a block starting with <code>{sid:'</code>),
 * prints the album, title and singer found in that record, and then resolves the
 * playable address through {@link #getMP3URL(String)}.
 *
 * <p>Only the first record on each line is processed.
 */
public class XingeBaidu {
	/**
	 * Downloads the index page and prints one entry per song record found.
	 * Failures are reported on standard error instead of being silently dropped.
	 */
	public XingeBaidu() {
		System.out.println("连接到百度新歌\n");

		try {
			URL url = new URL("http://xinge.baidu.com/");
			HttpURLConnection objHttp = (HttpURLConnection) url.openConnection();
			objHttp.setRequestProperty("Connection", "Keep-Alive");
			try {
				// NOTE(review): the reader uses the platform default charset; confirm
				// it matches the page encoding, otherwise titles print garbled.
				BufferedReader objReader = new BufferedReader(
						new InputStreamReader(objHttp.getInputStream()));
				try {
					String strLine;
					while ((strLine = objReader.readLine()) != null) {
						handleSongLine(strLine);
					}
				} finally {
					objReader.close();
				}
			} finally {
				objHttp.disconnect();
			}
		} catch (Exception e) {
			// The first failure (including a failed song lookup) ends the scan.
			System.err.println("XingeBaidu: failed to read the song list: " + e);
		}
	}

	/**
	 * Prints the metadata of the song record on the given line, if any, and
	 * resolves its MP3 address.
	 *
	 * @param strLine one line of the index page
	 * @throws Exception if resolving the MP3 address fails
	 */
	private void handleSongLine(String strLine) throws Exception {
		int beginIndex = strLine.indexOf("{sid:");
		if (beginIndex == -1) {
			return;
		}

		String album = fieldValue(strLine, beginIndex, "al:", "',ti");
		if (album != null) {
			System.out.printf("[唱片集:%s] ", album);
		}
		String title = fieldValue(strLine, beginIndex, "ti:", "',si");
		if (title != null) {
			System.out.printf("%s", title);
		}
		String singer = fieldValue(strLine, beginIndex, "si:", "',cp");
		if (singer != null) {
			System.out.printf(" [歌手:%s]", singer);
		}
		System.out.printf("\n");

		// "{sid:'" is 6 characters long; the id runs up to and including ".mp3".
		// Searching from the record start avoids picking up an earlier ".mp3".
		int idStart = beginIndex + 6;
		int mp3Index = strLine.indexOf(".mp3", idStart);
		if (mp3Index != -1) {
			getMP3URL("http://xinge.baidu.com/wgns/url/" + strLine.substring(idStart, mp3Index + 4));
		}
	}

	/**
	 * Extracts the single-quoted value that follows {@code key} in {@code line}.
	 *
	 * @param line       text to search
	 * @param from       index at which the search for {@code key} starts
	 * @param key        field name including the colon, e.g. {@code "al:"}
	 * @param terminator text that ends the value (closing quote plus next key)
	 * @return the non-empty value, or {@code null} if the key or terminator is
	 *         missing or the value is empty
	 */
	private static String fieldValue(String line, int from, String key, String terminator) {
		int keyIndex = line.indexOf(key, from);
		if (keyIndex == -1) {
			return null;
		}
		int valueStart = keyIndex + key.length() + 1; // skip the key and the opening quote
		int valueEnd = line.indexOf(terminator, valueStart);
		if (valueEnd == -1 || valueStart >= valueEnd) {
			return null;
		}
		return line.substring(valueStart, valueEnd);
	}

	/**
	 * Opens the song link and prints the real MP3 address: the first line of the
	 * response, prefixed with {@code http://xinge.baidu.com}.
	 *
	 * @param surl the song link
	 * @throws Exception if the link cannot be opened or read
	 */
	private void getMP3URL(String surl) throws Exception {
		HttpURLConnection objHttp = (HttpURLConnection) new URL(surl).openConnection();
		try {
			BufferedReader objReader = new BufferedReader(
					new InputStreamReader(objHttp.getInputStream()));
			try {
				String strLine = objReader.readLine();
				if (strLine != null) {
					System.out.println("http://xinge.baidu.com" + strLine); // the real MP3 address
					// playback or download code goes here...
				}
			} finally {
				objReader.close();
			}
		} finally {
			objHttp.disconnect();
		}
	}
}

/*
 * XingeBaidu.java - 获取'百度新歌'的MP3真实网址
 */
package jmp123.player;

import java.io.BufferedReader;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.net.URL;
import java.net.HttpURLConnection;

/**
 * Prints the real MP3 address of the songs listed on the Baidu "new songs" page.
 *
 * <p>All work happens in the constructor: it downloads the index page, looks for
 * lines containing a song record (a block starting with <code>{sid:'</code>),
 * prints the album, title and singer found in that record, and then resolves the
 * playable address through {@link #getMP3URL(String)}.
 *
 * <p>Only the first record on each line is processed.
 */
public class XingeBaidu {
	/**
	 * Downloads the index page and prints one entry per song record found.
	 * Failures are reported on standard error instead of being silently dropped.
	 */
	public XingeBaidu() {
		System.out.println("连接到百度新歌\n");

		try {
			URL url = new URL("http://xinge.baidu.com/");
			HttpURLConnection objHttp = (HttpURLConnection) url.openConnection();
			objHttp.setRequestProperty("Connection", "Keep-Alive");
			try {
				// NOTE(review): the reader uses the platform default charset; confirm
				// it matches the page encoding, otherwise titles print garbled.
				BufferedReader objReader = new BufferedReader(
						new InputStreamReader(objHttp.getInputStream()));
				try {
					String strLine;
					while ((strLine = objReader.readLine()) != null) {
						handleSongLine(strLine);
					}
				} finally {
					objReader.close();
				}
			} finally {
				objHttp.disconnect();
			}
		} catch (Exception e) {
			// The first failure (including a failed song lookup) ends the scan.
			System.err.println("XingeBaidu: failed to read the song list: " + e);
		}
	}

	/**
	 * Prints the metadata of the song record on the given line, if any, and
	 * resolves its MP3 address.
	 *
	 * @param strLine one line of the index page
	 * @throws Exception if resolving the MP3 address fails
	 */
	private void handleSongLine(String strLine) throws Exception {
		int beginIndex = strLine.indexOf("{sid:");
		if (beginIndex == -1) {
			return;
		}

		String album = fieldValue(strLine, beginIndex, "al:", "',ti");
		if (album != null) {
			System.out.printf("[唱片集:%s]  ", album);
		}
		String title = fieldValue(strLine, beginIndex, "ti:", "',si");
		if (title != null) {
			System.out.printf("%s", title);
		}
		String singer = fieldValue(strLine, beginIndex, "si:", "',cp");
		if (singer != null) {
			System.out.printf("  [歌手:%s]", singer);
		}
		System.out.printf("\n");

		// "{sid:'" is 6 characters long; the id runs up to and including ".mp3".
		// Searching from the record start avoids picking up an earlier ".mp3".
		int idStart = beginIndex + 6;
		int mp3Index = strLine.indexOf(".mp3", idStart);
		if (mp3Index != -1) {
			getMP3URL("http://xinge.baidu.com/wgns/url/" + strLine.substring(idStart, mp3Index + 4));
		}
	}

	/**
	 * Extracts the single-quoted value that follows {@code key} in {@code line}.
	 *
	 * @param line       text to search
	 * @param from       index at which the search for {@code key} starts
	 * @param key        field name including the colon, e.g. {@code "al:"}
	 * @param terminator text that ends the value (closing quote plus next key)
	 * @return the non-empty value, or {@code null} if the key or terminator is
	 *         missing or the value is empty
	 */
	private static String fieldValue(String line, int from, String key, String terminator) {
		int keyIndex = line.indexOf(key, from);
		if (keyIndex == -1) {
			return null;
		}
		int valueStart = keyIndex + key.length() + 1; // skip the key and the opening quote
		int valueEnd = line.indexOf(terminator, valueStart);
		if (valueEnd == -1 || valueStart >= valueEnd) {
			return null;
		}
		return line.substring(valueStart, valueEnd);
	}

	/**
	 * Opens the song link and prints the real MP3 address: the first line of the
	 * response, prefixed with {@code http://xinge.baidu.com}.
	 *
	 * @param surl the song link
	 * @throws Exception if the link cannot be opened or read
	 */
	private void getMP3URL(String surl) throws Exception {
		HttpURLConnection objHttp = (HttpURLConnection) new URL(surl).openConnection();
		try {
			BufferedReader objReader = new BufferedReader(
					new InputStreamReader(objHttp.getInputStream()));
			try {
				String strLine = objReader.readLine();
				if (strLine != null) {
					System.out.println("http://xinge.baidu.com" + strLine); // the real MP3 address
					// playback or download code goes here...
				}
			} finally {
				objReader.close();
			}
		} finally {
			objHttp.disconnect();
		}
	}
}

2.获取搜狗MP3真实网址

用上面的方法不能获取搜狗新歌100等的MP3真实网址，原因可能是其服务器有更严格的限制，防止用上面的方法去恶意搜索。前两天调试代码时连接上去，接收到的页面源文件中提示输入验证码，所以就不能用程序去解析其MP3网址了，晕，接连两天都不行，不知道是前两天调试程序连接的太频繁了还是别的什么原因，触发了网站的防恶意搜索保护。

http://music.sogou.com/song/newtop_1.html源文件片断

源代码如下，自己对比一下，就能琢磨出与第一种方法有什么不同了。总的步骤是一样的，仍是两步：

连接到http://music.sogou.com/song/newtop_1.html从接收到的数据流中查找到歌曲链接。打开这个页面的源文件，查找到window.open(，它后面用一对单引号括起来的内容就是歌曲的链接，这个链接是用于打开试听窗口的。
用程序连接到这个歌曲链接，从接收到的数据流中查找以http://开头、以.mp3结尾的字符串，这个字符串就是MP3的真实网址。

Java代码

/*
* SogouNewTop.java – 获取’搜狗音乐新歌TOP100’的MP3真实网址
*/
package jmp123.player;
import java.io.IOException;
import java.io.PrintWriter;
import java.io.BufferedReader;
import java.io.InputStreamReader;
import java.net.Socket;
/**
 * Minimal HTTP client on top of a raw socket: sends a GET request with a fixed
 * set of headers and exposes the raw response (status line and headers
 * included) through a {@link BufferedReader}.
 */
class MySocket {
	private String strReferer;
	private Socket socket;
	private PrintWriter pwOut;
	BufferedReader brIn;

	/**
	 * @param strReferer value sent in the {@code Referer} header of every request
	 */
	public MySocket(String strReferer) {
		this.strReferer = strReferer;
	}

	/**
	 * Connects to the host named in {@code surl} and sends a GET request for it.
	 * The response can then be read from {@link #getBufferedReader()}.
	 *
	 * <p>On an I/O error a message is printed and the JVM exits with status 1.
	 *
	 * @param surl an {@code http://host[:port][/path]} URL; a missing path is
	 *             requested as {@code /}
	 * @throws IllegalArgumentException if {@code surl} is null or not an
	 *                                  {@code http://} URL
	 * @throws NumberFormatException    if the port is not a number
	 */
	public void create(String surl) {
		if (surl == null || !surl.regionMatches(true, 0, "http://", 0, 7)) {
			throw new IllegalArgumentException("Only http:// URLs are supported: " + surl);
		}

		int iPort = 80;
		String strHost = surl.substring(7);
		String strPath = "/";
		int slashIndex = strHost.indexOf("/");
		if (slashIndex != -1) {
			strPath = strHost.substring(slashIndex);
			strHost = strHost.substring(0, slashIndex);
		}
		int colonIndex = strHost.indexOf(":");
		if (colonIndex != -1) {
			// "host:" with nothing after the colon keeps the default port
			if (strHost.length() - colonIndex > 1) {
				iPort = Integer.parseInt(strHost.substring(colonIndex + 1));
			}
			strHost = strHost.substring(0, colonIndex);
		}
		// The Host header must carry the port when it is not the default one.
		String strHostHeader = (iPort == 80) ? strHost : strHost + ":" + iPort;

		try {
			socket = new Socket(strHost, iPort);
			pwOut = new PrintWriter(socket.getOutputStream(), true);

			// Build the HTTP request header. HTTP requires CRLF line endings, so
			// println (platform line separator) is not used.
			StringBuilder request = new StringBuilder();
			request.append("GET ").append(strPath).append(" HTTP/1.1\r\n");
			request.append("Host:").append(strHostHeader).append("\r\n");
			request.append("Referer:").append(strReferer).append("\r\n");
			request.append("Accept:*/*\r\n");
			request.append("User-Agent:Mozilla/5.0 (compatible; MSIE 6.0; Windows NT 5.2; SV1; .NET CLR 1.1.4322)\r\n");
			// Callers read until end of stream, so ask the server to close the
			// connection after the response instead of keeping it alive.
			request.append("Connection: close\r\n");
			request.append("\r\n");
			pwOut.print(request.toString());
			pwOut.flush();

			// NOTE(review): the response is decoded with the platform default
			// charset and is not de-chunked; confirm this suits the target pages.
			brIn = new BufferedReader(new InputStreamReader(socket.getInputStream()));
		} catch (IOException e) {
			System.out.println("创建套接字/输入流错误。");
			System.err.println(e);
			System.exit(1);
		}
	}

	/**
	 * @return the reader over the raw response, or {@code null} if
	 *         {@link #create(String)} has not been called
	 */
	public BufferedReader getBufferedReader() {
		return brIn;
	}

	/**
	 * Closes the reader, the writer and the socket. Safe to call when
	 * {@link #create(String)} was never called. On an I/O error a message is
	 * printed and the JVM exits with status 1.
	 */
	public void close() {
		try {
			if (brIn != null) {
				brIn.close();
			}
			if (pwOut != null) {
				pwOut.close();
			}
			if (socket != null) {
				socket.close();
			}
		} catch (IOException e) {
			System.out.println("关闭套接字错误。");
			System.exit(1);
		}
	}
}
/**
* 解析搜狗音乐新歌TOP100页面获取MP3真实网址。
*/
public class SogouNewTop {
private static final String strReferer = “http://music.sogou.com/song/newtop_1.html”;
private MySocket htmlSocket = new MySocket(strReferer);
private MySocket urlSocket = new MySocket(strReferer);
/*
* 查找页面的歌曲链接
*/
public SogouNewTop() throws Exception {
System.out.println(“连接到搜狗音乐新歌TOP100\n”);
String strline = “”;
htmlSocket.create(strReferer);
BufferedReader brIn = htmlSocket.getBufferedReader();
int beginIndex, endIndex;
while ((strline = brIn.readLine()) != null) {
// 1.查找歌曲名(可省略)
if ((beginIndex = strline.indexOf(“consume=phb_song”)) != –1 ) {
strline = strline.substring(beginIndex);
if ((beginIndex = strline.indexOf(“>”)) != –1
&& (endIndex = strline.indexOf(“<“)) != –1) {
strline = strline.substring(beginIndex+1, endIndex);
System.out.println(“[歌曲名] “ + strline);
}
continue;
}
// 2.查找歌曲链接
if ((beginIndex = strline.indexOf(“onclick=\”window.open(“)) != –1
&& (beginIndex = strline.indexOf(“http://mp3.sogou.com/down.so”)) != –1
&& (endIndex = strline.indexOf(“‘,”)) != –1) {
strline = strline.substring(beginIndex, endIndex);
getMP3URL(strline);
}
}
htmlSocket.close();
}
/**
* 分析歌曲链接找到其真实网址
*/
private void getMP3URL(String surl) throws Exception {
String strline = “”;
urlSocket.create(surl);
BufferedReader brIn = urlSocket.getBufferedReader();
int beginIndex, endIndex;
while ((strline = brIn.readLine()) != null) {
if ((beginIndex = strline.indexOf(“http://”)) != –1
&& (endIndex = strline.indexOf(“.mp3”)) != –1) {
strline = strline.substring(beginIndex, endIndex + 4);
System.out.println(strline); //打印MP3的真实地址
//播放或下载的代码放这……;
break;
}
}
urlSocket.close();
}
}

/*
 * SogouNewTop.java - 获取'搜狗音乐新歌TOP100'的MP3真实网址
 */
package jmp123.player;

import java.io.IOException;
import java.io.PrintWriter;
import java.io.BufferedReader;
import java.io.InputStreamReader;
import java.net.Socket;

/**
 * Minimal HTTP client on top of a raw socket: sends a GET request with a fixed
 * set of headers and exposes the raw response (status line and headers
 * included) through a {@link BufferedReader}.
 */
class MySocket {
	private String strReferer;
	private Socket socket;
	private PrintWriter pwOut;
	BufferedReader brIn;

	/**
	 * @param strReferer value sent in the {@code Referer} header of every request
	 */
	public MySocket(String strReferer) {
		this.strReferer = strReferer;
	}

	/**
	 * Connects to the host named in {@code surl} and sends a GET request for it.
	 * The response can then be read from {@link #getBufferedReader()}.
	 *
	 * <p>On an I/O error a message is printed and the JVM exits with status 1.
	 *
	 * @param surl an {@code http://host[:port][/path]} URL; a missing path is
	 *             requested as {@code /}
	 * @throws IllegalArgumentException if {@code surl} is null or not an
	 *                                  {@code http://} URL
	 * @throws NumberFormatException    if the port is not a number
	 */
	public void create(String surl) {
		if (surl == null || !surl.regionMatches(true, 0, "http://", 0, 7)) {
			throw new IllegalArgumentException("Only http:// URLs are supported: " + surl);
		}

		int iPort = 80;
		String strHost = surl.substring(7);
		String strPath = "/";
		int slashIndex = strHost.indexOf("/");
		if (slashIndex != -1) {
			strPath = strHost.substring(slashIndex);
			strHost = strHost.substring(0, slashIndex);
		}
		int colonIndex = strHost.indexOf(":");
		if (colonIndex != -1) {
			// "host:" with nothing after the colon keeps the default port
			if (strHost.length() - colonIndex > 1) {
				iPort = Integer.parseInt(strHost.substring(colonIndex + 1));
			}
			strHost = strHost.substring(0, colonIndex);
		}
		// The Host header must carry the port when it is not the default one.
		String strHostHeader = (iPort == 80) ? strHost : strHost + ":" + iPort;

		try {
			socket = new Socket(strHost, iPort);
			pwOut = new PrintWriter(socket.getOutputStream(), true);

			// Build the HTTP request header. HTTP requires CRLF line endings, so
			// println (platform line separator) is not used.
			StringBuilder request = new StringBuilder();
			request.append("GET ").append(strPath).append(" HTTP/1.1\r\n");
			request.append("Host:").append(strHostHeader).append("\r\n");
			request.append("Referer:").append(strReferer).append("\r\n");
			request.append("Accept:*/*\r\n");
			request.append("User-Agent:Mozilla/5.0 (compatible; MSIE 6.0; Windows NT 5.2; SV1; .NET CLR 1.1.4322)\r\n");
			// Callers read until end of stream, so ask the server to close the
			// connection after the response instead of keeping it alive.
			request.append("Connection: close\r\n");
			request.append("\r\n");
			pwOut.print(request.toString());
			pwOut.flush();

			// NOTE(review): the response is decoded with the platform default
			// charset and is not de-chunked; confirm this suits the target pages.
			brIn = new BufferedReader(new InputStreamReader(socket.getInputStream()));
		} catch (IOException e) {
			System.out.println("创建套接字/输入流错误。");
			System.err.println(e);
			System.exit(1);
		}
	}

	/**
	 * @return the reader over the raw response, or {@code null} if
	 *         {@link #create(String)} has not been called
	 */
	public BufferedReader getBufferedReader() {
		return brIn;
	}

	/**
	 * Closes the reader, the writer and the socket. Safe to call when
	 * {@link #create(String)} was never called. On an I/O error a message is
	 * printed and the JVM exits with status 1.
	 */
	public void close() {
		try {
			if (brIn != null) {
				brIn.close();
			}
			if (pwOut != null) {
				pwOut.close();
			}
			if (socket != null) {
				socket.close();
			}
		} catch (IOException e) {
			System.out.println("关闭套接字错误。");
			System.exit(1);
		}
	}
}

/**
 * Parses the Sogou Music "new songs TOP100" page and prints the real MP3
 * address of each song found.
 *
 * <p>All work happens in the constructor. One request is made for the chart
 * page and one more for every song link found on it.
 */
public class SogouNewTop {
	private static final String strReferer = "http://music.sogou.com/song/newtop_1.html";
	private MySocket htmlSocket = new MySocket(strReferer);
	private MySocket urlSocket = new MySocket(strReferer);

	/**
	 * Downloads the chart page, prints each song name and resolves each song
	 * link through {@link #getMP3URL(String)}.
	 *
	 * @throws Exception if reading the page or a song link fails
	 */
	public SogouNewTop() throws Exception {
		System.out.println("连接到搜狗音乐新歌TOP100\n");
		htmlSocket.create(strReferer);
		try {
			BufferedReader brIn = htmlSocket.getBufferedReader();
			String strline;
			int beginIndex, endIndex;

			while ((strline = brIn.readLine()) != null) {
				// 1. Song name (optional): the text between the first '>' after the
				// marker and the next '<'.
				if ((beginIndex = strline.indexOf("consume=phb_song")) != -1) {
					int openIndex = strline.indexOf(">", beginIndex);
					// Search for '<' only after '>' so that an earlier '<' cannot
					// produce an inverted range.
					int closeIndex = (openIndex == -1) ? -1 : strline.indexOf("<", openIndex + 1);
					if (closeIndex != -1) {
						System.out.println("[歌曲名] " + strline.substring(openIndex + 1, closeIndex));
					}
					continue;
				}

				// 2. Song link: the down.so URL inside the window.open(...) call, up
				// to the closing quote and comma that follow it.
				if (strline.indexOf("onclick=\"window.open(") != -1
						&& (beginIndex = strline.indexOf("http://mp3.sogou.com/down.so")) != -1
						&& (endIndex = strline.indexOf("',", beginIndex)) != -1) {
					getMP3URL(strline.substring(beginIndex, endIndex));
				}
			}
		} finally {
			htmlSocket.close();
		}
	}

	/**
	 * Requests the song link and prints the first string in the response that
	 * starts with {@code http://} and ends with {@code .mp3}.
	 *
	 * @param surl the song link
	 * @throws Exception if reading the response fails
	 */
	private void getMP3URL(String surl) throws Exception {
		urlSocket.create(surl);
		try {
			BufferedReader brIn = urlSocket.getBufferedReader();
			String strline;

			while ((strline = brIn.readLine()) != null) {
				int beginIndex = strline.indexOf("http://");
				// Look for ".mp3" only after the URL start.
				int endIndex = (beginIndex == -1) ? -1 : strline.indexOf(".mp3", beginIndex);
				if (endIndex != -1) {
					System.out.println(strline.substring(beginIndex, endIndex + 4)); // the real MP3 address
					// playback or download code goes here...
					break;
				}
			}
		} finally {
			urlSocket.close();
		}
	}
}

另外，http://mp3.sogou.com/的：

歌曲TOP100　http://music.sogou.com/song/topsong.html
单曲抢先听　http://music.sogou.com/song/newnew_1.html
劲爆dj音乐榜　http://music.sogou.com/song/newdj_1
欧美流行榜　http://music.sogou.com/song/enpop_1.html

等页面的搜索方法跟上面的是一样的，并不建议你写代码到 http://music.sogou.com/song/目录下搜索*.html并用上述方法解析（就是实现传说中的网络蜘蛛的一部分功能），这样一顿海搜不礼貌哈，别人藏着掖着的就是不想让你查找到其MP3的网址的嘛。这些页面上的歌曲经常更新，固定查找某一页面的MP3也可以听到新歌，不错了。一边干活一边听听歌，挺不错的哦~~

MP3网站的加密方法经常变更，到目前为止这种方法可用，不能保证一直可用。应用示例到我的主页http://jmp123.sf.net/ 下载最新的MP3播放程序，程序（jar包）用法见其中的readme.txt。

[转载]获取网络MP3真实地址

相关推荐

热门标签

分类

链接表

觉得文章有用就打赏一下文章作者

支付宝扫一扫打赏

微信扫一扫打赏