Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
13 changes: 13 additions & 0 deletions 1.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,13 @@
import xml.etree.ElementTree as ET
from urllib.request import urlopen
import json

def _child_text(item, tag):
    """Return the text of the first ``tag`` child of ``item``, or None if absent."""
    node = item.find(tag)
    # Compare against None explicitly: an Element without children is falsy.
    return node.text if node is not None else None


def parse_headlines(xml_text):
    """Extract the publication date and title of every RSS ``<item>``.

    Args:
        xml_text: The RSS document as a string.

    Returns:
        A list with one ``{'pubDate': ..., 'title': ...}`` dict per ``<item>``
        element, in document order. A value is ``None`` when the
        corresponding child element is missing or has no text.
    """
    root = ET.fromstring(xml_text)
    return [
        {'pubDate': _child_text(item, 'pubDate'),
         'title': _child_text(item, 'title')}
        for item in root.iter('item')
    ]


def main():
    """Download the lenta.ru RSS feed and save its headlines to news.json."""
    # Use the response as a context manager so the connection is closed
    # even if reading or decoding fails.
    with urlopen('https://lenta.ru/rss') as response:
        data = response.read().decode('utf8')

    newsJson = parse_headlines(data)

    with open("news.json", "w", encoding='UTF-8') as file:
        # ensure_ascii=False keeps non-ASCII characters readable in the output.
        json.dump(newsJson, file, ensure_ascii=False, indent=1)


if __name__ == "__main__":
    main()
13 changes: 13 additions & 0 deletions 2.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,13 @@
import xml.etree.ElementTree as ET
from urllib.request import urlopen
import json

def parse_items(xml_text):
    """Convert every RSS ``<item>`` into a dict of its direct children.

    Args:
        xml_text: The RSS document as a string.

    Returns:
        A list with one dict per ``<item>`` element, in document order,
        mapping each child's tag to its text. A child without text maps to
        ``None``. If an item contains several children with the same tag,
        only the last one is kept.
    """
    root = ET.fromstring(xml_text)
    return [
        {child.tag: child.text for child in item}
        for item in root.iter('item')
    ]


def main():
    """Download the lenta.ru RSS feed and save all item fields to news_all.json."""
    # Use the response as a context manager so the connection is closed
    # even if reading or decoding fails.
    with urlopen('https://lenta.ru/rss') as response:
        data = response.read().decode('utf8')

    newsJson = parse_items(data)

    with open("news_all.json", "w", encoding='UTF-8') as file:
        # ensure_ascii=False keeps non-ASCII characters readable in the output.
        json.dump(newsJson, file, ensure_ascii=False, indent=1)


if __name__ == "__main__":
    main()
13 changes: 13 additions & 0 deletions API_Gradskiy.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,13 @@
from itertools import groupby
from json import loads
from urllib.request import urlopen

url = 'https://ru.wikipedia.org/w/api.php?action=query&format=json&prop=revisions&rvlimit=500&titles=%D0%93%D1%80%D0%B0%D0%B4%D1%81%D0%BA%D0%B8%D0%B9,_%D0%90%D0%BB%D0%B5%D0%BA%D1%81%D0%B0%D0%BD%D0%B4%D1%80_%D0%91%D0%BE%D1%80%D0%B8%D1%81%D0%BE%D0%B2%D0%B8%D1%87'


def count_edits_per_day(response):
    """Count revisions per calendar day in a decoded revisions query response.

    Args:
        response: The decoded JSON response, a dict with a
            ``['query']['pages']`` mapping whose values may carry a
            ``'revisions'`` list of dicts with a ``'timestamp'`` string.

    Returns:
        A list of ``(date, count)`` tuples, where ``date`` is the first ten
        characters of the timestamp. Only consecutive revisions are grouped,
        so the result has one entry per day only if the revisions arrive
        ordered by time. Pages without a ``'revisions'`` key contribute
        nothing.
    """
    counts = []
    # Iterate over whatever pages came back instead of hard-coding a page id,
    # so the function works for any title.
    for page in response['query']['pages'].values():
        days = (rev['timestamp'][:10] for rev in page.get('revisions', []))
        for day, same_day in groupby(days):
            counts.append((day, sum(1 for _ in same_day)))
    return counts


def main():
    """Fetch the revision list from ``url`` and print the edit count per day."""
    # Use the response as a context manager so the connection is closed
    # even if reading or decoding fails.
    with urlopen(url) as response:
        data = loads(response.read().decode('utf8'))

    for date, edits in count_edits_per_day(data):
        print(date, edits)


if __name__ == "__main__":
    main()
# date: 2021-11-28 count: 153
# The spike in edits on this date is related to the death of Alexander Gradsky.
14 changes: 14 additions & 0 deletions API_Zhan-Pol_Correlation.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
from itertools import groupby
from json import loads
from urllib.request import urlopen

url = 'https://ru.wikipedia.org/w/api.php?action=query&format=json&prop=revisions&rvlimit=500&titles=%D0%91%D0%B5%D0%BB%D1%8C%D0%BC%D0%BE%D0%BD%D0%B4%D0%BE,_%D0%96%D0%B0%D0%BD-%D0%9F%D0%BE%D0%BB%D1%8C'


def count_edits_per_day(response):
    """Count revisions per calendar day in a decoded revisions query response.

    Args:
        response: The decoded JSON response, a dict with a
            ``['query']['pages']`` mapping whose values may carry a
            ``'revisions'`` list of dicts with a ``'timestamp'`` string.

    Returns:
        A list of ``(date, count)`` tuples, where ``date`` is the first ten
        characters of the timestamp. Only consecutive revisions are grouped,
        so the result has one entry per day only if the revisions arrive
        ordered by time. Pages without a ``'revisions'`` key contribute
        nothing.
    """
    counts = []
    # Iterate over whatever pages came back instead of hard-coding a page id,
    # so the function works for any title.
    for page in response['query']['pages'].values():
        days = (rev['timestamp'][:10] for rev in page.get('revisions', []))
        for day, same_day in groupby(days):
            counts.append((day, sum(1 for _ in same_day)))
    return counts


def main():
    """Fetch the revision list from ``url`` and print the edit count per day."""
    # Use the response as a context manager so the connection is closed
    # even if reading or decoding fails.
    with urlopen(url) as response:
        data = loads(response.read().decode('utf8'))

    for date, edits in count_edits_per_day(data):
        print(date, edits)


if __name__ == "__main__":
    main()
# date: 2021-09-06 count: 58
# Jean-Paul Belmondo did indeed die on this date,
# but this approach is not very convenient, because a large number of edits can be related to various events.
Loading