Jsoup解析html终于成功了!!!
package com.eric.pickupjoke.activity; import java.io.IOException;
import java.io.InputStream;
import java.util.ArrayList;
import java.util.Calendar;
import java.util.HashMap;
import java.util.List;
import java.util.Locale;
import java.util.Map; import org.apache.http.HttpResponse;
import org.apache.http.HttpStatus;
import org.apache.http.client.ClientProtocolException;
import org.apache.http.client.HttpClient;
import org.apache.http.client.methods.HttpGet;
import org.apache.http.impl.client.DefaultHttpClient;
import org.apache.http.util.EntityUtils;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.nodes.TextNode;
import org.jsoup.select.Elements; import android.app.Activity;
import android.graphics.drawable.ColorDrawable;
import android.os.AsyncTask;
import android.os.Bundle;
import android.util.Log;
import android.view.Menu;
import android.widget.SimpleAdapter;
import android.widget.Toast; import com.eric.pickupjoke.conn.IsConnection;
import com.eric.pickupjoke.listview.MyListView;
import com.eric.pickupjoke.listview.MyListView.OnMoreListener;
import com.eric.pickupjoke.listview.MyListView.OnRefreshListener; public class AdultJokeActivity extends Activity {
MyListView articleListView;
List<HashMap<String, String>> articleList;
SimpleAdapter adapter;
OnRefreshListener mOnRefreshListener;
OnMoreListener mOnMoreListener;
static int index = 2; @Override
protected void onCreate(Bundle savedInstanceState) {
super.onCreate(savedInstanceState);
setContentView(R.layout.activity_adult_joke);
init();
} void init() {
getWindow().setBackgroundDrawable(new ColorDrawable(-1));
articleListView = (MyListView) findViewById(R.id.article_list_view);
articleList = new ArrayList<HashMap<String, String>>();
InputStream is;
try {
is = this.getResources().getAssets().open("source_html.html");
Document doc = Jsoup.parse(is, "GBK", "http://www.haha365.com");
Log.i("AsyncTask in AdultJokeActivity", "5");
Elements twoArticleElements = doc
.select("div.content>div.left>div.r_c>div.cat_llb");
Log.i("AsyncTask in AdultJokeActivity", "6");
if (twoArticleElements != null && twoArticleElements.size() > 0) {
for (Element twoArticleElement : twoArticleElements) {
Log.i("AsyncTask in AdultJokeActivity", "7");
List<TextNode> textList = twoArticleElement.textNodes();
Map<String, String> map1 = new HashMap<String, String>();
Map<String, String> map2 = new HashMap<String, String>();
Log.i("AsyncTask in AdultJokeActivity", "8");
map1.put("time", textList.get(0).text());
map1.put("title", twoArticleElement.child(1).text());
map1.put("content", twoArticleElement.child(3).text());
map2.put("time", textList.get(4).text());
map2.put("title", twoArticleElement.child(6).text());
map2.put("content", twoArticleElement.child(8).text());
Log.i("AsyncTask in AdultJokeActivity", "9");
articleList.add((HashMap<String, String>) map1);
articleList.add((HashMap<String, String>) map2);
Log.i("AsyncTask in AdultJokeActivity", "10");
}
}
} catch (IOException e) {
e.printStackTrace();
}
Log.i("init() in AdultJokeActivity", "1");
adapter = new SimpleAdapter(this, articleList,
R.layout.article_list_item, new String[] { "title", "content",
"time" }, new int[] { R.id.title, R.id.content,
R.id.time });
articleListView.setAdapter(adapter);
Log.i("init() in AdultJokeActivity", "2"); mOnRefreshListener = new OnRefreshListener() {
@Override
public void onRefresh() {
Log.i("onRefresh in AdultJokeActivity", "1");
if (new IsConnection(AdultJokeActivity.this).isConnected()) {
new LoadArticleTask()
.execute("http://www.haha365.com/Adult_joke/"); }
}
};
mOnMoreListener = new OnMoreListener() {
@Override
public void onMore() {
Log.i("onMore in AdultJokeActivity", "1");
if (new IsConnection(AdultJokeActivity.this).isConnected()
&& index <= 18) {
new LoadArticleTask()
.execute("http://www.haha365.com/Adult_joke/index_"
+ String.valueOf(index) + ".htm");
index++;
} }
};
articleListView.setOnRefreshListener(mOnRefreshListener);
articleListView.setOnMoreListener(mOnMoreListener);
} private class LoadArticleTask extends AsyncTask<String, Void, String> {
@Override
protected String doInBackground(String... urls) {
try {
Log.i("AsyncTask in AdultJokeActivity", "1");
HttpClient httpClient = new DefaultHttpClient();
HttpGet httpGet = new HttpGet(urls[0]);
HttpResponse httpResponse = httpClient.execute(httpGet);
Log.i("AsyncTask in AdultJokeActivity", "2");
if (httpResponse.getStatusLine().getStatusCode() == HttpStatus.SC_OK) {
Log.i("AsyncTask in AdultJokeActivity", "3");
String html = EntityUtils.toString(
httpResponse.getEntity(), "GBK");
// System.out.println(html);
Log.i("AsyncTask in AdultJokeActivity", "4");
return html;
} else {
Toast.makeText(AdultJokeActivity.this, "获取HTML文档失败",
Toast.LENGTH_SHORT).show();
return null;
}
} catch (ClientProtocolException e) {
e.printStackTrace();
return null;
} catch (IOException e) {
e.printStackTrace();
return null;
}
} @Override
protected void onPostExecute(String html) {
Document doc = Jsoup.parse(html);
Log.i("AsyncTask in AdultJokeActivity", "5");
Elements twoArticleElements = doc
.select("div.content>div.left>div.r_c>div.cat_llb");
Log.i("AsyncTask in AdultJokeActivity", "6");
if (twoArticleElements != null && twoArticleElements.size() > 0) {
for (Element twoArticleElement : twoArticleElements) {
Log.i("AsyncTask in AdultJokeActivity", "7");
List<TextNode> textList = twoArticleElement.textNodes();
Map<String, String> map1 = new HashMap<String, String>();
Map<String, String> map2 = new HashMap<String, String>();
Log.i("AsyncTask in AdultJokeActivity", "8");
map1.put("time", textList.get(0).text());
map1.put("title", twoArticleElement.child(1).text());
map1.put("content", twoArticleElement.child(3).text());
map2.put("time", textList.get(4).text());
map2.put("title", twoArticleElement.child(6).text());
map2.put("content", twoArticleElement.child(8).text());
Log.i("AsyncTask in AdultJokeActivity", "9");
articleList.add((HashMap<String, String>) map1);
articleList.add((HashMap<String, String>) map2);
Log.i("AsyncTask in AdultJokeActivity", "10");
}
} else {
Log.i("AsyncTask in AdultJokeActivity", "8");
}
adapter.notifyDataSetChanged();
articleListView.onRefreshComplete("更新时间:" + getCalendarString());
articleListView.onMoreComplete();
Log.i("AsyncTask in AdultJokeActivity", "11");
}
} @Override
public boolean onCreateOptionsMenu(Menu menu) {
// Inflate the menu; this adds items to the action bar if it is present.
getMenuInflater().inflate(R.menu.adult_joke, menu);
return true;
} public String getCalendarString() {
Calendar c = Calendar.getInstance(Locale.CHINA);
int mHour = c.get(Calendar.HOUR_OF_DAY);
int mMinter = c.get(Calendar.MINUTE);
return String.valueOf(mHour) + ":" + String.valueOf(mMinter);
} }
Jsoup解析html终于成功了!!!的更多相关文章
- 一步步教你为网站开发Android客户端---HttpWatch抓包,HttpClient模拟POST请求,Jsoup解析HTML代码,动态更新ListView
本文面向Android初级开发者,有一定的Java和Android知识即可. 文章覆盖知识点:HttpWatch抓包,HttpClient模拟POST请求,Jsoup解析HTML代码,动态更新List ...
- Android利用Jsoup解析html 开发网站客户端小记。
这些天业余时间比较多,闲来无事,想起了以前看过开发任意网站客户端的一篇文章,就是利用jsoup解析网站网页,通过标签获取想要的内容.好了废话不多说,用到的工具为 jsoup-1.7.2.jar包,具体 ...
- [java] jsoup 解析网页获取省市区域信息
到国家统计局抓取数据, 到该class下解析数据 /** * jsoup解析网页 * @author xwolf * @date 2016-12-13 18:11 * @since V1.0.0 */ ...
- jsoup解析HTML及简单实例
jsoup 中文参考文献 http://www.open-open.com/jsoup/ 本文将利用jsoup,简单实现网络抓取的功能,并给出一个小实例,该实例效果为:获取作者本人在博客园写的所 ...
- jsoup解析HTML
Connection conn = Jsoup.connect(String url); conn.data("txtBill", key);// 设置关键字查询字段 Docume ...
- Android开发探秘之三:利用jsoup解析HTML页面
这节主要是讲解jsoup解析HTML页面.由于在android开发过程中,不可避免的涉及到web页面的抓取,解析,展示等等,所以,在这里我主要展示下利用jsoup jar包来抓取cnbeta.com网 ...
- 终于成功仿了一次Kalman滤波器
终于成功仿了一次Kalman滤波器 首先是测试了从网上down的一段代码 % KALMANF - updates a system state vector estimate based upon a ...
- Jsoup 解析 HTML
Jsoup 文档 方法 要取得一个属性的值,可以使用Node.attr(String key) 方法 对于一个元素中的文本,可以使用Element.text()方法 对于要取得元素或属性中的HTML内 ...
- Jsoup解析HTML、加载文档等实例
一.引入jsoup的jar包:http://jsoup.org/download 补充:http://jsoup.org/apidocs/ Jsoup API 可以了解更详细的内容 二.Js ...
随机推荐
- Windows下Go语言的环境搭建
在本地搭建了一个开发GO语言的开发环境,给大家分享一下用go语言写的第一个hello world的过程,希望对大家有所帮助. 1.想写GO语言首先得下载go语言的开发包 官方下载地址:https:// ...
- MySQL数据类型的验证
CHAR char (M) M字符,长度是M*字符编码长度,M最大255. 验证如下: mysql)) default charset=utf8; ERROR (): ); use BLOB or T ...
- 【记录】T-SQL 分组排序中取出最新数据
示例 Product 表结构: 示例 Product 表数据: 想要的效果是,以 GroupName 字段分组,取出分组中通过 Sort 降序最新的数据,通过示例数据,可以推算出结果数据的 ID 应该 ...
- aud$定位错误用户密码登陆数据库的具体信息
环境:Oracle 11.2.0.3 客户端使用错误的用户密码登陆数据库 查询最近1天由于密码错误登陆失败的信息 查询当前审计中有哪些returncode值 1. 客户端使用错误的用户密码登陆数据库 ...
- 【JUC】JDK1.8源码分析之ConcurrentSkipListMap(二)
一.前言 最近在做项目的同时也在修复之前项目的一些Bug,所以忙得没有时间看源代码,今天都完成得差不多了,所以又开始源码分析之路,也着笔记录下ConcurrentSkipListMap的源码的分析过程 ...
- C# 中的as和is小结
在读.Net 框架设计的时候,关于C#中类型转化中的部分内容,在此总结记录,分享予大家. 首先,我们声明一个简单的继承关系. Class Father { Int x; } Class Child:F ...
- 11.struts2文件上传
文件上传 1.上传单个文件 2.上传多个文件 1.上传单个文件 实现步骤: (1)导入一个Jar包:commons-io-1.3.2.jar.只所以要导入这个Jar包,是因为要用到一个工具类Fil ...
- Azure Media Service (1) 使用OBS进行Azure Media Service直播
<Windows Azure Platform 系列文章目录> 今天正好有客户问如何使用OBS进行Azure Media Service直播,我这里简单介绍一下. 先决条件: 1. OBS ...
- clr enabled Server Configuration Option
在SQL Server中启用CLR,可以执行下面SQL语句: EXEC sp_configure 'clr enabled'; '; RECONFIGURE; Source Code
- C#开发微信门户及应用(29)--微信个性化菜单的实现
有一段时间没有接着微信的主题继续介绍里面的功能模块了,这段时间来,微信也做了不少的变化改动,针对这些特性我全面核对了一下相关的微信公众号和企业号的接口,对原有的微信API和系统管理做了全面的更新,本随 ...