Jsoup解析html终于成功了!!!
package com.eric.pickupjoke.activity; import java.io.IOException;
import java.io.InputStream;
import java.util.ArrayList;
import java.util.Calendar;
import java.util.HashMap;
import java.util.List;
import java.util.Locale;
import java.util.Map; import org.apache.http.HttpResponse;
import org.apache.http.HttpStatus;
import org.apache.http.client.ClientProtocolException;
import org.apache.http.client.HttpClient;
import org.apache.http.client.methods.HttpGet;
import org.apache.http.impl.client.DefaultHttpClient;
import org.apache.http.util.EntityUtils;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.nodes.TextNode;
import org.jsoup.select.Elements; import android.app.Activity;
import android.graphics.drawable.ColorDrawable;
import android.os.AsyncTask;
import android.os.Bundle;
import android.util.Log;
import android.view.Menu;
import android.widget.SimpleAdapter;
import android.widget.Toast; import com.eric.pickupjoke.conn.IsConnection;
import com.eric.pickupjoke.listview.MyListView;
import com.eric.pickupjoke.listview.MyListView.OnMoreListener;
import com.eric.pickupjoke.listview.MyListView.OnRefreshListener; public class AdultJokeActivity extends Activity {
MyListView articleListView;
List<HashMap<String, String>> articleList;
SimpleAdapter adapter;
OnRefreshListener mOnRefreshListener;
OnMoreListener mOnMoreListener;
static int index = 2; @Override
protected void onCreate(Bundle savedInstanceState) {
super.onCreate(savedInstanceState);
setContentView(R.layout.activity_adult_joke);
init();
} void init() {
getWindow().setBackgroundDrawable(new ColorDrawable(-1));
articleListView = (MyListView) findViewById(R.id.article_list_view);
articleList = new ArrayList<HashMap<String, String>>();
InputStream is;
try {
is = this.getResources().getAssets().open("source_html.html");
Document doc = Jsoup.parse(is, "GBK", "http://www.haha365.com");
Log.i("AsyncTask in AdultJokeActivity", "5");
Elements twoArticleElements = doc
.select("div.content>div.left>div.r_c>div.cat_llb");
Log.i("AsyncTask in AdultJokeActivity", "6");
if (twoArticleElements != null && twoArticleElements.size() > 0) {
for (Element twoArticleElement : twoArticleElements) {
Log.i("AsyncTask in AdultJokeActivity", "7");
List<TextNode> textList = twoArticleElement.textNodes();
Map<String, String> map1 = new HashMap<String, String>();
Map<String, String> map2 = new HashMap<String, String>();
Log.i("AsyncTask in AdultJokeActivity", "8");
map1.put("time", textList.get(0).text());
map1.put("title", twoArticleElement.child(1).text());
map1.put("content", twoArticleElement.child(3).text());
map2.put("time", textList.get(4).text());
map2.put("title", twoArticleElement.child(6).text());
map2.put("content", twoArticleElement.child(8).text());
Log.i("AsyncTask in AdultJokeActivity", "9");
articleList.add((HashMap<String, String>) map1);
articleList.add((HashMap<String, String>) map2);
Log.i("AsyncTask in AdultJokeActivity", "10");
}
}
} catch (IOException e) {
e.printStackTrace();
}
Log.i("init() in AdultJokeActivity", "1");
adapter = new SimpleAdapter(this, articleList,
R.layout.article_list_item, new String[] { "title", "content",
"time" }, new int[] { R.id.title, R.id.content,
R.id.time });
articleListView.setAdapter(adapter);
Log.i("init() in AdultJokeActivity", "2"); mOnRefreshListener = new OnRefreshListener() {
@Override
public void onRefresh() {
Log.i("onRefresh in AdultJokeActivity", "1");
if (new IsConnection(AdultJokeActivity.this).isConnected()) {
new LoadArticleTask()
.execute("http://www.haha365.com/Adult_joke/"); }
}
};
mOnMoreListener = new OnMoreListener() {
@Override
public void onMore() {
Log.i("onMore in AdultJokeActivity", "1");
if (new IsConnection(AdultJokeActivity.this).isConnected()
&& index <= 18) {
new LoadArticleTask()
.execute("http://www.haha365.com/Adult_joke/index_"
+ String.valueOf(index) + ".htm");
index++;
} }
};
articleListView.setOnRefreshListener(mOnRefreshListener);
articleListView.setOnMoreListener(mOnMoreListener);
} private class LoadArticleTask extends AsyncTask<String, Void, String> {
@Override
protected String doInBackground(String... urls) {
try {
Log.i("AsyncTask in AdultJokeActivity", "1");
HttpClient httpClient = new DefaultHttpClient();
HttpGet httpGet = new HttpGet(urls[0]);
HttpResponse httpResponse = httpClient.execute(httpGet);
Log.i("AsyncTask in AdultJokeActivity", "2");
if (httpResponse.getStatusLine().getStatusCode() == HttpStatus.SC_OK) {
Log.i("AsyncTask in AdultJokeActivity", "3");
String html = EntityUtils.toString(
httpResponse.getEntity(), "GBK");
// System.out.println(html);
Log.i("AsyncTask in AdultJokeActivity", "4");
return html;
} else {
Toast.makeText(AdultJokeActivity.this, "获取HTML文档失败",
Toast.LENGTH_SHORT).show();
return null;
}
} catch (ClientProtocolException e) {
e.printStackTrace();
return null;
} catch (IOException e) {
e.printStackTrace();
return null;
}
} @Override
protected void onPostExecute(String html) {
Document doc = Jsoup.parse(html);
Log.i("AsyncTask in AdultJokeActivity", "5");
Elements twoArticleElements = doc
.select("div.content>div.left>div.r_c>div.cat_llb");
Log.i("AsyncTask in AdultJokeActivity", "6");
if (twoArticleElements != null && twoArticleElements.size() > 0) {
for (Element twoArticleElement : twoArticleElements) {
Log.i("AsyncTask in AdultJokeActivity", "7");
List<TextNode> textList = twoArticleElement.textNodes();
Map<String, String> map1 = new HashMap<String, String>();
Map<String, String> map2 = new HashMap<String, String>();
Log.i("AsyncTask in AdultJokeActivity", "8");
map1.put("time", textList.get(0).text());
map1.put("title", twoArticleElement.child(1).text());
map1.put("content", twoArticleElement.child(3).text());
map2.put("time", textList.get(4).text());
map2.put("title", twoArticleElement.child(6).text());
map2.put("content", twoArticleElement.child(8).text());
Log.i("AsyncTask in AdultJokeActivity", "9");
articleList.add((HashMap<String, String>) map1);
articleList.add((HashMap<String, String>) map2);
Log.i("AsyncTask in AdultJokeActivity", "10");
}
} else {
Log.i("AsyncTask in AdultJokeActivity", "8");
}
adapter.notifyDataSetChanged();
articleListView.onRefreshComplete("更新时间:" + getCalendarString());
articleListView.onMoreComplete();
Log.i("AsyncTask in AdultJokeActivity", "11");
}
} @Override
public boolean onCreateOptionsMenu(Menu menu) {
// Inflate the menu; this adds items to the action bar if it is present.
getMenuInflater().inflate(R.menu.adult_joke, menu);
return true;
} public String getCalendarString() {
Calendar c = Calendar.getInstance(Locale.CHINA);
int mHour = c.get(Calendar.HOUR_OF_DAY);
int mMinter = c.get(Calendar.MINUTE);
return String.valueOf(mHour) + ":" + String.valueOf(mMinter);
} }
Jsoup解析html终于成功了!!!的更多相关文章
- 一步步教你为网站开发Android客户端---HttpWatch抓包,HttpClient模拟POST请求,Jsoup解析HTML代码,动态更新ListView
本文面向Android初级开发者,有一定的Java和Android知识即可. 文章覆盖知识点:HttpWatch抓包,HttpClient模拟POST请求,Jsoup解析HTML代码,动态更新List ...
- Android利用Jsoup解析html 开发网站客户端小记。
这些天业余时间比较多,闲来无事,想起了以前看过开发任意网站客户端的一篇文章,就是利用jsoup解析网站网页,通过标签获取想要的内容.好了废话不多说,用到的工具为 jsoup-1.7.2.jar包,具体 ...
- [java] jsoup 解析网页获取省市区域信息
到国家统计局抓取数据, 到该class下解析数据 /** * jsoup解析网页 * @author xwolf * @date 2016-12-13 18:11 * @since V1.0.0 */ ...
- jsoup解析HTML及简单实例
jsoup 中文参考文献 http://www.open-open.com/jsoup/ 本文将利用jsoup,简单实现网络抓取的功能,并给出一个小实例,该实例效果为:获取作者本人在博客园写的所 ...
- jsoup解析HTML
Connection conn = Jsoup.connect(String url); conn.data("txtBill", key);// 设置关键字查询字段 Docume ...
- Android开发探秘之三:利用jsoup解析HTML页面
这节主要是讲解jsoup解析HTML页面.由于在android开发过程中,不可避免的涉及到web页面的抓取,解析,展示等等,所以,在这里我主要展示下利用jsoup jar包来抓取cnbeta.com网 ...
- 终于成功仿了一次Kalman滤波器
终于成功仿了一次Kalman滤波器 首先是测试了从网上down的一段代码 % KALMANF - updates a system state vector estimate based upon a ...
- Jsoup 解析 HTML
Jsoup 文档 方法 要取得一个属性的值,可以使用Node.attr(String key) 方法 对于一个元素中的文本,可以使用Element.text()方法 对于要取得元素或属性中的HTML内 ...
- Jsoup解析HTML、加载文档等实例
一.引入jsoup的jar包:http://jsoup.org/download 补充:http://jsoup.org/apidocs/ Jsoup API 可以了解更详细的内容 二.Js ...
随机推荐
- Java中的网络编程
Java中的网路编程主要是Java的Socket编程,属于JavaEE中的高级的部分,以下内容是对java网路编程的一个小结,代码都是经过编译调试的 C/S程序应用:客户/服务器模式,如QQ客户端 ...
- 如何高效地向Redis插入大量的数据
最近有个哥们在群里问,有一个日志,里面存的是IP地址(一行一个),如何将这些IP快速导入到Redis中. 我刚开始的建议是Shell+redis客户端. 今天,查看Redis官档,发现文档的首页部分( ...
- 不要给<a>设置outline:none
outline属性有什么作用 原文链接 a{outline:none} do not do it 当用户使用tab键进行链接切换时,该属性会在当前选中的链接(获得焦点)使用该属性,一般来说是虚线框 的 ...
- 1Z0-053 争议题目解析24
1Z0-053 争议题目解析24 考试科目:1Z0-053 题库版本:V13.02 题库中原题为: 24.Which of the following information will be gath ...
- MySQL入门01-MySQL源码安装
操作系统:CentOS 6.7 MySQL版本:5.6.30 1.前期准备 2.系统配置 3.CMake编译配置 4.make && make install 5.后期配置和测试 Re ...
- JavaWeb学习总结(五十二)——使用JavaMail创建邮件和发送邮件
一.RFC882文档简单说明 RFC882文档规定了如何编写一封简单的邮件(纯文本邮件),一封简单的邮件包含邮件头和邮件体两个部分,邮件头和邮件体之间使用空行分隔. 邮件头包含的内容有: from字段 ...
- spring boot 配置启动后执行sql, 中文乱码
spring.datasource.schema指定启动后执行的sql文件位置. 我发现中文乱码,原因是没有指定执行sql script encoding: spring: datasource: u ...
- 基于OpenSLL的RSA加密应用(非算法)
基于OpenSLL的RSA加密应用(非算法) iOS开发中的小伙伴应该是经常用der和p12进行加密解密,而且在通常加密不止一种加密算法,还可以加点儿盐吧~本文章主要阐述的是在iOS中基于openSL ...
- 自己封装的一个JS分享组件
因为工作的需求之前也封装过一个JS分享插件,集成了我们公司常用的几个分享平台. 但是总感觉之前的结构上很不理想,样式,行为揉成一起,心里想的做的完美,实际上总是很多的偏差,所以这次我对其进行了改版. ...
- Windows 10预览版14316开启Bash命令支持
00x0 前言 4月7日凌晨,微软推送了最新的Windows 10一周年更新预览版14316,其中重要的是原生支持Linux Bash命令行支持. 00x1 问题 如何开启Linux Bash命令行? ...