This repository was archived by the owner on Oct 15, 2020. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 10
/
Copy pathgithub.py
61 lines (47 loc) · 1.85 KB
/
github.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
#from .magic import process_url
import titledb.magic
from .models import (
DBSession,
URL
)
import json
import re
import requests
import transaction
import logging
log = logging.getLogger(__name__)
def github_full_scan(cache_root=None):
url_like = 'https://github.com/%/releases/download/%'
urls = DBSession.query(URL).filter_by(active=True).filter(URL.url.like(url_like)).all()
api_urls = []
if urls:
for url in urls:
(repouser, reponame) = github_parse_user_repo(url)
api_urls.append(github_user_repo_to_api(repouser, reponame))
api_urls = set(api_urls)
headers = {}
headers['User-Agent'] = 'Mozilla/5.0 (Nintendo 3DS; Mobile; rv:10.0) Gecko/20100101 TitleDB/1.0'
for github_api_url in api_urls:
userpass = json.load(open("private/github_credentials.json"))
req = requests.get(github_api_url, headers=headers, auth=(userpass['username'],userpass['password']))
data = json.loads(req.text)
#import pdb; pdb.set_trace()
if 'assets' in data:
for asset in data['assets']:
try:
with transaction.manager:
with DBSession.begin_nested():
titledb.magic.process_url(asset['browser_download_url'], cache_root=cache_root)
#transaction.commit()
except:
transaction.rollback()
else:
log.info("GitHub API Failure: %s", github_api_url)
def github_parse_user_repo(url):
m = re.fullmatch('https?://github.com/([^/]+)/([^/]+)/releases/download/.*/[^/]+', url.url)
log.debug(m)
if m:
return(m.group(1), m.group(2))
return (None, None)
def github_user_repo_to_api(repouser, reponame):
return('https://api.github.com/repos/' + repouser + '/' + reponame + '/releases/latest')