当前位置：移动技术网 > 移动技术>移动开发>Android > android Jsoup获取网站内容 android获取新闻标题实例

android Jsoup获取网站内容 android获取新闻标题实例

2019年07月24日 | 移动技术网移动技术 | 我要评论

近期在做一个简单的新闻客户端界面时用到了 Jsoup 来获取网页内容，使用起来特别方便。它也被我的一位学长称为学习 Android 网络编程必学的东西，在此分享一下自己近期所学。

首先还是给出效果：

上面是通过 TextView 显示的从网站上获取到的全部内容，下面是通过 ListView 显示的所获取新闻的标题，这样显示比较便于理解。

mainactivity：

import android.app.Activity;
import android.content.Intent;
import android.net.Uri;
import android.os.AsyncTask;
import android.os.Bundle;
import android.text.method.ScrollingMovementMethod;
import android.util.Log;
import android.view.Menu;
import android.view.View;
import android.widget.AdapterView;
import android.widget.AdapterView.OnItemClickListener;
import android.widget.ArrayAdapter;
import android.widget.ListView;
import android.widget.TextView;

import org.apache.http.HttpResponse;
import org.apache.http.client.HttpClient;
import org.apache.http.client.methods.HttpPost;
import org.apache.http.impl.client.DefaultHttpClient;
import org.apache.http.util.EntityUtils;
import org.jsoup.Jsoup;
import org.jsoup.nodes.Document;
import org.jsoup.nodes.Element;
import org.jsoup.select.Elements;

import java.util.ArrayList;
import java.util.List;
 
@suppresswarnings("unused") 
public class mainactivity extends activity { 
  private textview tv_htmlcode; 
  //此处搞一个textview主要来显示news列表里面存储的内容，仅仅便于分析和理解 
 
  private string url_eol = "http://www.cnwust.com/newslist/1_1", 
      tag = "atag"; 
  //这是索要获取内容的网址 
 
  private list<news> newslist; 
  //自定义的news的类，用于存放索要获取新闻的目录、时间以及点击后显示的网址 
 
  private listview lv_result; 
  private arrayadapter<string> lv_adapter; 
 
  @override 
  protected void oncreate(bundle savedinstancestate) { 
    super.oncreate(savedinstancestate); 
    setcontentview(r.layout.activity_main); 
    lv_result = (listview) findviewbyid(r.id.lv_result); 
    tv_htmlcode = (textview) findviewbyid(r.id.tv_htmlcode); 
    tv_htmlcode.setmovementmethod(scrollingmovementmethod.getinstance()); 
 
    connecttask c1 = new connecttask(); 
    c1.execute(); 
 
  } 
 
  @override 
  public boolean oncreateoptionsmenu(menu menu) { 
    getmenuinflater().inflate(r.menu.menu_main, menu); 
    return true; 
  } 
 
  public class connecttask extends asynctask<void, void, string> { 
 
    @override 
    protected string doinbackground(void... params) { 
      string result = connecteol(); 
      return result; 
    } 
 
    @override 
    protected void onpostexecute(string result) { 
      // tv_htmlcode.settext(result); 
      newslist = getnews(result); 
      list<string> newstitles = new arraylist<string>(); 
      for (news news : newslist) { 
        tv_htmlcode.append(news.getnewstitle() + "\n"); 
        tv_htmlcode.append(news.getnewstime() + "\n"); 
        tv_htmlcode.append(news.getnewsurl() + "\n"); 
        newstitles.add(news.getnewstitle()); 
      } 
    /* 为listview添加适配器 */ 
 
      lv_adapter = new arrayadapter<string>(mainactivity.this, 
          android.r.layout.simple_list_item_1, newstitles); 
      lv_result.setadapter(lv_adapter); 
 
    /* 为listview添加点击打开对应网页功能 */ 
      lv_result.setonitemclicklistener(new onitemclicklistener() { 
 
        @override 
        public void onitemclick(adapterview<?> arg0, view arg1, 
                    int arg2, long arg3) { 
          final uri uri = uri.parse(newslist.get(arg2).getnewsurl()); 
          final intent it = new intent(intent.action_view, uri); 
          startactivity(it); 
        } 
 
      }); 
      //此处为了方便就点击就直接调用设备默认浏览器打开网址 
 
      super.onpostexecute(result); 
 
 
    } 
 
  } 
 
  /* 连接eol的方法 返回整个网页经过截取之后的的源代码 */ 
  public string connecteol() { 
    string result = ""; 
    try { 
      httpclient httpclient = new defaulthttpclient(); 
      httppost httppost = new httppost(url_eol); 
      httpresponse response = httpclient.execute(httppost); 
      string res = entityutils.tostring(response.getentity(), "utf-8"); 
 
      int st = res.indexof("<div id=\"result\">"); 
      int ed = res.indexof("<div id=\"pager\">"); 
      //这边算是最重要的部分，代码获取的便是这两段之间的部分。 
 
      string content = res.substring(st, ed); 
      st = content.indexof("<ul>") + 4; 
      ed = content.indexof("</ul>"); 
      content = content.substring(st, ed); 
      result = content; 
    } catch (exception e) { 
      log.d(tag, e.tostring()); 
    } 
    return result; 
  } 
 
  /* 对源代码进行解析截取的方法 返回一个news数组 */ 
  public list<news> getnews(string htmlcode) { 
    list<news> newslist = new arraylist<news>(); 
    document doc = jsoup.parse(htmlcode); 
    log.d(tag, "解析html中"); 
    elements lis = doc.getelementsbytag("li"); 
    log.d(tag, "lis的size " + lis.size()); 
    for (element li : lis) { 
      string newstime = li.getelementsbytag("span").text(); 
      string newstitle = li.getelementsbytag("a").text(); 
      string newsurl = li.getelementsbytag("a").attr("href"); 
      //这三段算是jsoup从html中获取内容的关键了，很容易理解。 
 
      newsurl = newsurl.replace("/news", "http://www.cnwust.com/news"); 
      //直接从html的代码中获取的url是相对路径，此处使用replace改为绝对路径 
 
      log.d(tag, newstime); 
      log.d(tag, newstitle); 
      log.d(tag, newsurl); 
 
      news newst = new news(); 
      newst.setnewstime(newstime); 
      newst.setnewstitle(newstitle); 
      newst.setnewsurl(newsurl); 
      newslist.add(newst); 
    } 
    return newslist; 
  } 
}

news：

/**
 * Plain mutable holder for one news entry: its title, its publication time and the
 * URL that is opened when the entry is selected.
 *
 * <p>All three values are stored as given; none of them is validated, and each is
 * {@code null} until it has been set.
 */
public class news {
  private String newstime;
  private String newsurl;
  private String newstitle;

  /** Creates an empty entry; populate it through the setters. */
  public news() {

  }

  /**
   * Creates a fully populated entry.
   *
   * @param newstitle headline of the entry
   * @param newstime publication time as text
   * @param newsurl address of the full article
   */
  public news(String newstitle, String newstime, String newsurl) {
    this.newstime = newstime;
    this.newsurl = newsurl;
    this.newstitle = newstitle;
  }

  /** @return the publication time as text, or {@code null} if never set */
  public String getnewstime() {
    return newstime;
  }

  /** @param newstime publication time as text */
  public void setnewstime(String newstime) {
    this.newstime = newstime;
  }

  /** @return the address of the full article, or {@code null} if never set */
  public String getnewsurl() {
    return newsurl;
  }

  /** @param newsurl address of the full article */
  public void setnewsurl(String newsurl) {
    this.newsurl = newsurl;
  }

  /** @return the headline, or {@code null} if never set */
  public String getnewstitle() {
    return newstitle;
  }

  /** @param newstitle headline of the entry */
  public void setnewstitle(String newstitle) {
    this.newstitle = newstitle;
  }

}

activity_main:

<!-- Main screen: a scrollable TextView with the parsed entries, placed above the
     ListView that shows the news titles. -->
<RelativeLayout xmlns:android="http://schemas.android.com/apk/res/android"
  xmlns:tools="http://schemas.android.com/tools"
  android:layout_width="match_parent"
  android:layout_height="match_parent"
  android:paddingBottom="@dimen/activity_vertical_margin"
  android:paddingLeft="@dimen/activity_horizontal_margin"
  android:paddingRight="@dimen/activity_horizontal_margin"
  android:paddingTop="@dimen/activity_vertical_margin"
  tools:context=".newslist" >

  <!-- Text dump of every parsed entry; vertical scrollbars are enabled. -->
  <TextView
    android:id="@+id/tv_htmlcode"
    android:layout_width="match_parent"
    android:layout_height="150dp"
    android:layout_above="@+id/lv_result"
    android:layout_alignParentTop="true"
    android:layout_centerHorizontal="true"
    android:scrollbars="vertical" />

  <!-- News titles, anchored to the bottom of the screen. -->
  <ListView
    android:id="@+id/lv_result"
    android:layout_width="match_parent"
    android:layout_height="230dp"
    android:layout_alignLeft="@+id/tv_htmlcode"
    android:layout_alignParentBottom="true" >
  </ListView>

</RelativeLayout>

此处对 HTML 代码的解析，部分新手可能还不太清楚，在此建议使用 Chrome 浏览器，可以直接查看网站的源码（部分加密的网站看不到）。下面看一下具体使用的截图：

1、首先先要打开到你要获取内容的网站

2、右击你要获取的内容，并选择审查元素。

3、使用 Jsoup 解析 HTML 代码。

最后是附上源码

以上就是本文的全部内容，希望对大家的学习有所帮助，也希望大家多多支持移动技术网。

您可能感兴趣的文章:

如对本文有疑问，点击进行留言回复！！

WebRTC拥塞控制之REMB and GCC

前言WebRTC在处理网络拥塞问题时一般有网络拥塞（congestion）是指在分组交换网络中传送分组的数目太多... [阅读全文]
Unity性能优化---音频

向unity中导入音频文件总是会让内存增加，因此对音频文件的压缩变得更加重要 ... [阅读全文]
IjkPlayer【1】 Demo Android的最简单实现

一、目的 Ijkplayer最为一个经典的视屏播放开源框架，虽然是开源框架对于刚入门的人来说看到源码以及脚本的... [阅读全文]
教你怎么把微信小程序分享到朋友圈

7月8日收到邀请，可将小程序页面分享到朋友圈。适用于内容型页面的分享，不适用于有较多交互的页面分享。该功能为be... [阅读全文]
一起Talk Android吧（第二百六十回：Android中的BottomNavigationView概述）

各位看官们大家好，上一回中咱们说的是Android中Toolbar的例子,这一回咱们说的例子是BottomNav... [阅读全文]
数据压缩实验六 MPEG音频编码实验

一、实验原理1、感知编码的基本思路（1）心理声学模型：听觉系统中存在一个听觉阈值电平，低于这个电平的声音信号就听... [阅读全文]
Android记之语言Binder

理解binder设计binder是为了设计一套 [阅读全文]
android调节音量——AudioManager的应用

下面博客链接为实例代码链接，本章博客就不重复写了。我主要总结了一个方法，方便开发时候使用。AudioManage... [阅读全文]
Android图片印刻，阳刻，素描图效果处理

介绍我参与开发的妙趣剪纸app使用的图片处理相关的技术关于妙趣剪纸，各大android商店都可以下载，下面贴出小... [阅读全文]
电路设计、分析、仿真之2：电流检测及保护电路仿真

原理图注: V1代替电流采样信号。差分电路仿真和分析差分电路由U1D及周边元件所组成。其放大倍数为15K/1K=... [阅读全文]

网友评论


验证码：

android Jsoup获取网站内容 android获取新闻标题实例

2019年07月24日 | 移动技术网移动技术 | 我要评论

您可能感兴趣的文章:

相关文章:

网友评论