Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
9 changes: 9 additions & 0 deletions API.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
from itertools import groupby
from json import loads
from urllib.request import urlopen

# Fetch up to 500 revisions of one ru.wikipedia article and print, for every
# date key, how many revisions carry it.
url = 'https://ru.wikipedia.org/w/api.php?action=query&format=json&prop=revisions&rvlimit=500&titles=%D0%93%D1%80%D0%B0%D0%B4%D1%81%D0%BA%D0%B8%D0%B9,_%D0%90%D0%BB%D0%B5%D0%BA%D1%81%D0%B0%D0%BD%D0%B4%D1%80_%D0%91%D0%BE%D1%80%D0%B8%D1%81%D0%BE%D0%B2%D0%B8%D1%87'

# Use the response as a context manager so the connection is closed
# deterministically instead of being left to the garbage collector.
with urlopen(url) as response:
    data = loads(response.read().decode('utf8'))

# Walk whatever pages the API returned instead of hard-coding a page id, so
# the script keeps working when the title in `url` changes. A page without a
# 'revisions' list contributes nothing.
# The first 10 characters of each timestamp are used as the grouping key
# (presumably the YYYY-MM-DD part of an ISO 8601 timestamp).
# NOTE(review): groupby only merges adjacent equal keys, so this relies on
# the API returning revisions ordered by timestamp; confirm.
group_data = groupby(
    rev['timestamp'][:10]
    for page in data['query']['pages'].values()
    for rev in page.get('revisions', [])
)

# Plain loop: printing is a side effect, not a value worth collecting.
for d, e in group_data:
    print(d, len(list(e)))
18 changes: 18 additions & 0 deletions correlation.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,18 @@
from itertools import groupby
from json import loads
from urllib.request import urlopen

def sort_by_revisions(gr):
    """Return the key of the largest group in *gr*.

    *gr* is an iterable of ``(key, items)`` pairs, such as the result of
    ``itertools.groupby``. Each group is consumed to count its items.

    When several groups share the largest size, the key of the earliest one
    is returned. An empty *gr* (or one whose groups are all empty) yields
    the empty string.
    """
    best_key = ''
    best_size = 0
    for key, members in gr:
        size = sum(1 for _ in members)
        # Strict comparison: an equally large later group never replaces
        # the earlier winner.
        if size > best_size:
            best_key = key
            best_size = size
    return best_key

# Fetch up to 500 revisions of one ru.wikipedia article and print the date
# key that has the most revisions.
# The stray trailing space that used to end this literal has been removed.
url = 'https://ru.wikipedia.org/w/api.php?action=query&format=json&prop=revisions&rvlimit=500&titles=%D0%91%D0%B5%D0%BB%D1%8C%D0%BC%D0%BE%D0%BD%D0%B4%D0%BE,_%D0%96%D0%B0%D0%BD-%D0%9F%D0%BE%D0%BB%D1%8C'

# Use the response as a context manager so the connection is closed
# deterministically instead of being left to the garbage collector.
with urlopen(url) as response:
    data = loads(response.read().decode('utf8'))

# Walk whatever pages the API returned instead of hard-coding a page id, so
# the script keeps working when the title in `url` changes. A page without a
# 'revisions' list contributes nothing.
# The first 10 characters of each timestamp are used as the grouping key
# (presumably the YYYY-MM-DD part of an ISO 8601 timestamp).
# NOTE(review): groupby only merges adjacent equal keys, so this relies on
# the API returning revisions ordered by timestamp; confirm.
grouped_data = groupby(
    rev['timestamp'][:10]
    for page in data['query']['pages'].values()
    for rev in page.get('revisions', [])
)
print(sort_by_revisions(grouped_data))
802 changes: 802 additions & 0 deletions news.json

Large diffs are not rendered by default.

16 changes: 16 additions & 0 deletions news1.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,16 @@
from xml.etree.ElementTree import fromstring
from json import dump
from urllib.request import urlopen

# Download the lenta.ru RSS feed and save the publication date and title of
# every item to news.json.

# Use the response as a context manager so the connection is closed
# deterministically instead of being left to the garbage collector.
with urlopen('https://lenta.ru/rss') as response:
    data = response.read().decode('utf8')
root = fromstring(data)

# findtext() yields None for an absent child, whereas `.find(...).text`
# raises AttributeError when the element is missing.
res = [
    {
        'pubDate': i.findtext('pubDate'),
        'title': i.findtext('title'),
    }
    for i in root.findall('channel/item')
]

# ensure_ascii=False writes non-ASCII characters as-is rather than as
# \uXXXX escapes; the file is opened as UTF-8 to match.
with open("news.json", "w", encoding='UTF-8') as out:
    dump(res, out, indent=1, ensure_ascii=False)
1,998 changes: 1,998 additions & 0 deletions news2.json

Large diffs are not rendered by default.

12 changes: 12 additions & 0 deletions news2.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,12 @@
from json import dump
from urllib.request import urlopen
from xml.etree.ElementTree import fromstring

# Download the lenta.ru RSS feed and save every child field of every item
# to news2.json.

# Use the response as a context manager so the connection is closed
# deterministically instead of being left to the garbage collector.
with urlopen('https://lenta.ru/rss') as response:
    root = fromstring(response.read().decode('utf8'))

# One dict per <item>, mapping each direct child's tag to its text.
# If a tag occurs more than once inside an item, the later occurrence
# overwrites the earlier one; a child without text maps to None.
res = [
    {c.tag: c.text for c in item}
    for item in root.findall('channel/item')
]

# ensure_ascii=False writes non-ASCII characters as-is rather than as
# \uXXXX escapes; the file is opened as UTF-8 to match.
with open("news2.json", "w", encoding='UTF-8') as out:
    dump(res, out, indent=1, ensure_ascii=False)
14 changes: 14 additions & 0 deletions отчет.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
# Информация об Александре Градском

<img width="1280" alt="image" src="https://user-images.githubusercontent.com/73825639/146766685-a640332c-51dd-4f75-923f-28d6ea21669b.png">

Самое большое количество правок случилось 28.11.2021, в день смерти Александра Градского.

# Информация о Жан-Поле Бельмондо

<img width="1280" alt="image" src="https://user-images.githubusercontent.com/73825639/146767037-2683392b-d6ea-4e82-8ef6-b4848530064b.png">

Резкий скачок правок произошёл 6.09.2021 — в день смерти Жан-Поля Бельмондо.

День, в который случилось больше всего правок, совпал с датой смерти Жан-Поля Бельмондо.
Но такой метод нельзя использовать, потому что большое количество правок могло быть вызвано другими событиями.