xiaofud
diff --git a/‎.idea/workspace.xml
Lines changed: 116 additions & 25 deletions b/‎.idea/workspace.xml
Lines changed: 116 additions & 25 deletions
diff --git a/‎ielts_news.py
Lines changed: 64 additions & 0 deletions b/‎ielts_news.py
Lines changed: 64 additions & 0 deletions
diff --git a/‎internetUtil.py renamed to ‎loginUtil.py b/‎internetUtil.py renamed to ‎loginUtil.py
diff --git a/‎totalCodeLine.py
Lines changed: 2 additions & 1 deletion b/‎totalCodeLine.py
Lines changed: 2 additions & 1 deletion
@@ -0,0 +1,64 @@
+#!/usr/bin/env python3
+# coding=utf-8
+__author__ = 'smallfly'
+
+import requests
+from bs4 import BeautifulSoup
+
+# URL of the news listing page; fetched by the script entry point below.
+NEWS_ADDRESS = "https://ielts.etest.net.cn/allnews"
+
+class NewsItem:
+    """Container for one news entry.
+
+    The three constructor arguments are kept in a private dict and exposed
+    as the attributes ``date``, ``title`` and ``url``.
+    """
+
+    def __init__(self, date, title, url):
+        """Store *date*, *title* and *url* exactly as given."""
+        self.__data = {
+            "date": date,
+            "title": title,
+            "url": url,
+        }
+
+    def __repr__(self):
+        """Return the repr of the underlying dict."""
+        return repr(self.__data)
+
+    def __getattr__(self, item):
+        """Resolve ``date`` / ``title`` / ``url`` from the private dict.
+
+        Raises:
+            AttributeError: if *item* is not one of the stored keys.
+        """
+        # __getattr__ only runs after normal lookup has failed.  Fetch the
+        # dict through __dict__ instead of ``self.__data``: on an instance
+        # whose __init__ has not run (copy.copy, unpickling) the name-mangled
+        # attribute is missing, and ``self.__data`` would re-enter this method
+        # until RecursionError.
+        data = self.__dict__.get("_NewsItem__data", {})
+        if item in data:
+            return data[item]
+        raise AttributeError("NewsItem has no attribute named {}.".format(item))
+
+
+def get_raw_news(address, timeout=10):
+    """Download the page at *address* and return its text decoded as UTF-8.
+
+    Args:
+        address: URL to fetch.
+        timeout: seconds to wait for the server before giving up.  Without a
+            timeout ``requests.get`` may block indefinitely.
+
+    Returns:
+        The response body as ``str``, or ``None`` when the response status
+        is not OK.
+
+    Raises:
+        requests.RequestException: on connection failure or timeout.
+    """
+    resp = requests.get(address, timeout=timeout)
+    if not resp.ok:
+        return None
+    # Force UTF-8 rather than relying on the encoding requests guesses.
+    resp.encoding = "UTF-8"
+    return resp.text
+
+def parse_news(content):
+    """Extract the news entries from the HTML of the listing page.
+
+    Every ``<li class="main-sub-act-new">`` is expected to hold two direct
+    child ``<span>`` elements: the first wraps the ``<a>`` link of the news
+    entry, the second holds the publication date surrounded by one delimiter
+    character on each side.
+
+    Args:
+        content: HTML text of the page.
+
+    Returns:
+        A list of ``NewsItem`` objects in document order.  ``<li>`` elements
+        that do not have the expected structure are skipped.
+    """
+    # Name the parser explicitly so the result does not depend on which
+    # optional parsers happen to be installed.
+    soup = BeautifulSoup(content, "html.parser")
+    news_items = []
+    for li in soup.find_all("li", {"class": "main-sub-act-new"}):
+        # Look at direct child spans only; indexing li.contents would break
+        # on whitespace text nodes between the tags.
+        spans = li.find_all("span", recursive=False)
+        if len(spans) < 2:
+            continue
+        # First span: wraps the <a> tag carrying the news link.
+        a_tag = spans[0].a
+        if a_tag is None or not a_tag.has_attr("href"):
+            continue
+        # Second span: publication date.  get_text() also copes with nested
+        # markup, where .string would be None.
+        date_string = spans[1].get_text(strip=True)
+        # Drop the first and last character (the delimiters around the date).
+        news_items.append(
+            NewsItem(date_string[1:-1], a_tag.get_text(strip=True), a_tag["href"])
+        )
+    return news_items
+
+def pretty_print(items):
+    """Print *items* to stdout, ordered by ``date`` descending.
+
+    Each item is printed as three labelled lines (date, title, URL) followed
+    by an empty line.  The caller's sequence is left untouched: sorting is
+    done on a copy instead of in place.
+
+    Args:
+        items: iterable of objects exposing ``date``, ``title`` and ``url``.
+    """
+    for item in sorted(items, key=lambda x: x.date, reverse=True):
+        print("Date:", item.date)
+        print("Title:", item.title)
+        print("URL:", item.url)
+        print()
+
+if __name__ == "__main__":
+    # Script entry point: fetch the listing page and, if the download
+    # succeeded, parse it and print the entries.
+    page = get_raw_news(NEWS_ADDRESS)
+    if page is not None:
+        pretty_print(parse_news(page))
@@ -23,7 +23,7 @@ def get_suffix():
     """
     suffix_list = list()
     while True:
-        suffix = input("input the suffix like .cpp(end input by empty line)\n")
+        suffix = input("input the suffix like cpp(end input by empty line)\n")
         suffix = suffix.strip()
         if suffix == "":
             break
@@ -43,6 +43,7 @@ def get_line_count(root_path, suffix_list):
             # print(os.path.abspath(file))
             # 匹配后缀名
             file_suffix = os.path.splitext(file)[1]
+            file_suffix = file_suffix.strip('.')
             if file_suffix in suffix_list:
                 # 读取该文件
                 with open(os.path.join(root, file)) as f: