mirror of
https://github.com/TrentSPalmer/hugo_themes_report.git
synced 2025-01-08 20:48:21 -08:00
major rewrite rank_hugo_themes.py
This commit is contained in:
parent
cb8c491a3e
commit
46b919ff50
@ -2,40 +2,40 @@
|
||||
# rank_hugo_themes.py
|
||||
|
||||
import re
|
||||
import toml
|
||||
import toml
|
||||
from calendar import timegm
|
||||
from time import strptime
|
||||
from requests import get
|
||||
from json import loads as json_loads
|
||||
# from json import loads as json_loads
|
||||
from sys import argv as sys_argv
|
||||
from base64 import b64decode
|
||||
from ast import literal_eval
|
||||
|
||||
from sqlalchemy import create_engine,Column,Integer,VARCHAR,TEXT
|
||||
from sqlalchemy import create_engine, Column, Integer, VARCHAR, TEXT
|
||||
from sqlalchemy.ext.declarative import declarative_base
|
||||
from sqlalchemy.orm import deferred,sessionmaker
|
||||
from sqlalchemy.orm import deferred, sessionmaker
|
||||
|
||||
# Engine for the SQLite file 'hugothemes.db'; echo=False keeps SQLAlchemy
# from logging the SQL statements it emits.
engine = create_engine('sqlite:///hugothemes.db', echo=False)
# Declarative base class that the ORM model classes in this file inherit from.
Base = declarative_base()
|
||||
|
||||
|
||||
class Tags(Base):
    """ORM model for the 'tags' table, keyed by the tag string."""

    __tablename__ = 'tags'

    # The tag text itself is the primary key.
    tag = Column(VARCHAR, primary_key=True)
    # Text column holding the themes associated with this tag.
    theme_list = Column(TEXT)
    # Integer count stored alongside theme_list.
    num_themes = Column(Integer)

    def __repr__(self):
        """Return a debug string showing tag, theme_list and num_themes."""
        repr_string = "<(tag = '%s', theme_list = '%s', num_themes = '%s')>"
        repr_values = (self.tag, self.theme_list, self.num_themes)
        return repr_string % repr_values
|
||||
|
||||
|
||||
class Hugothemes_from_gitlab(Base):
|
||||
__tablename__ = 'hugothemes_from_gitlab'
|
||||
|
||||
name = Column(VARCHAR,primary_key=True)
|
||||
name = Column(VARCHAR, primary_key=True)
|
||||
url = Column(TEXT)
|
||||
commit_sha = Column(TEXT)
|
||||
gitlab_id = Column(TEXT)
|
||||
@ -43,22 +43,25 @@ class Hugothemes_from_gitlab(Base):
|
||||
commit_date = Column(TEXT)
|
||||
star_count = Column(Integer)
|
||||
themes_toml_content = Column(TEXT)
|
||||
default_branch = Column(TEXT)
|
||||
|
||||
def __repr__(self):
    """Return a debug string listing the stored fields of this row.

    The format string names nine fields, so the value tuple must supply
    nine values in the same order; ``self.url`` was previously missing,
    which made ``repr()`` raise ``TypeError`` (not enough arguments for
    format string).
    """
    repr_string = "<(name = '%s', url = '%s', commit_sha = '%s', gitlab_id = '%s', commit_date_in_seconds = '%s'"
    repr_string += ", commit_date = '%s', star_count = '%s', themes_toml_content = '%s', default_branch = '%s')>"
    repr_values = (
        self.name, self.url, self.commit_sha, self.gitlab_id,
        self.commit_date_in_seconds, self.commit_date,
        self.star_count, self.themes_toml_content, self.default_branch
    )
    return repr_string % repr_values
|
||||
|
||||
|
||||
class Hugothemes(Base):
|
||||
__tablename__ = 'hugothemes'
|
||||
|
||||
name = Column(VARCHAR,primary_key=True)
|
||||
name = Column(VARCHAR, primary_key=True)
|
||||
ETag = Column(TEXT)
|
||||
url = Column(TEXT)
|
||||
jsondump = deferred(Column(TEXT))
|
||||
commit_sha = Column(TEXT)
|
||||
commit_date = Column(TEXT)
|
||||
commit_date_in_seconds = Column(Integer)
|
||||
@ -68,166 +71,106 @@ class Hugothemes(Base):
|
||||
themes_toml_content = deferred(Column(TEXT))
|
||||
tags_list = Column(TEXT)
|
||||
num_tags = Column(Integer)
|
||||
dot_gitmodules_content = Column(TEXT)
|
||||
default_branch = Column(TEXT)
|
||||
|
||||
def __repr__(self):
    """Return a debug string listing thirteen fields of this row.

    The thirteen placeholders in the format string are matched, in order,
    by the thirteen values in ``repr_values``. ``jsondump`` and
    ``dot_gitmodules_content`` are not included.
    """
    repr_string = "<(name = '%s', ETag = '%s', url = '%s', commit_sha = '%s', commit_date = '%s'"
    repr_string += ", commit_date_in_seconds = '%s', repo_ETag = '%s', stargazers_count = '%s', themes_toml_ETag = '%s'"
    repr_string += ", themes_toml_content = '%s', tags_list = '%s', num_tags = '%s', default_branch = '%s')>"
    repr_values = (
        self.name, self.ETag, self.url,
        self.commit_sha, self.commit_date, self.commit_date_in_seconds,
        self.repo_ETag, self.stargazers_count, self.themes_toml_ETag,
        self.themes_toml_content, self.tags_list,
        self.num_tags, self.default_branch
    )
    return repr_string % repr_values
|
||||
|
||||
|
||||
# Previous value of THEMESLISTREPO, kept under its own name.
OLDTHEMESLISTREPO = 'gohugoio/hugoThemes'
# GitHub "owner/repo" whose themes.txt supplies the list of themes.
THEMESLISTREPO = 'gohugoio/hugoThemesSiteBuilder'
# Theme entries such as 'github.com/owner/repo'; starts empty and is filled
# at run time.
THEMESLIST = []
|
||||
|
||||
|
||||
def get_themes_name_list():
    """Return every THEMESLIST entry with its first 11 characters removed.

    For entries such as 'github.com/owner/repo' or 'gitlab.com/owner/repo'
    this strips the host and the slash, leaving 'owner/repo'.
    """
    host_prefix_len = len('github.com/')  # 11; 'gitlab.com/' is the same length
    return [entry[host_prefix_len:] for entry in THEMESLIST]
|
||||
|
||||
|
||||
def get_gitlab_themes_list():
    """Return the THEMESLIST entries that start with 'gitlab.com', unchanged."""
    return [entry for entry in THEMESLIST if entry.startswith('gitlab.com')]
|
||||
|
||||
|
||||
def get_gitlab_themes_name_list():
    """Return the gitlab.com entries of THEMESLIST without their first 11 characters.

    'gitlab.com/owner/repo' becomes 'owner/repo'; entries that do not start
    with 'gitlab.com' are left out.
    """
    host_prefix_len = len('gitlab.com/')  # 11
    return [
        entry[host_prefix_len:]
        for entry in THEMESLIST
        if entry.startswith('gitlab.com')
    ]
|
||||
|
||||
|
||||
def get_github_themes_name_list():
    """Return the github.com entries of THEMESLIST without their first 11 characters.

    'github.com/owner/repo' becomes 'owner/repo'; entries that do not start
    with 'github.com' are left out.
    """
    host_prefix_len = len('github.com/')  # 11
    return [
        entry[host_prefix_len:]
        for entry in THEMESLIST
        if entry.startswith('github.com')
    ]
|
||||
|
||||
|
||||
# Request headers shared by the API calls in this module. When the script is
# run with exactly one command-line argument, that argument is sent as a
# token in the Authorization header; otherwise no extra headers are sent.
if len(sys_argv) == 2:
    headers = {'Authorization': 'token ' + sys_argv[1]}
else:
    headers = {}
|
||||
|
||||
|
||||
def get_hugo_themes_list():
|
||||
session = sessionmaker(bind=engine)()
|
||||
themes_list_repo = session.query(Hugothemes).filter_by(name=THEMESLISTREPO).first()
|
||||
api_call_url = "https://api.github.com/repos/"+THEMESLISTREPO+"/contents"
|
||||
if themes_list_repo.url != api_call_url: themes_list_repo.url = api_call_url
|
||||
themes_list_url = f"https://raw.githubusercontent.com/{THEMESLISTREPO}/main/themes.txt"
|
||||
response = get(themes_list_url)
|
||||
|
||||
if themes_list_repo.ETag != None:
|
||||
headers['If-None-Match'] = themes_list_repo.ETag
|
||||
else:
|
||||
if 'If-None-Match' in headers: del headers['If-None-Match']
|
||||
|
||||
if len(headers) == 0:
|
||||
response = get(api_call_url)
|
||||
else:
|
||||
response = get(api_call_url, headers=headers)
|
||||
if response.status_code == 200:
|
||||
themes_list_repo.ETag = response.headers['ETag'].lstrip('W/')
|
||||
themes_list_repo.jsondump = response.text
|
||||
session.commit()
|
||||
elif response.status_code == 403:
|
||||
print(response.status_code,get_hugo_themes_list.__name__)
|
||||
session.commit()
|
||||
write_reports()
|
||||
quit()
|
||||
print(response.status_code,get_hugo_themes_list.__name__)
|
||||
for x in response.text.splitlines():
|
||||
if (x[0:10] == 'gitlab.com' or x[0:10] == 'github.com'):
|
||||
THEMESLIST.append(x)
|
||||
|
||||
|
||||
def update_hugo_themes_submodule_list():
|
||||
session = sessionmaker(bind=engine)()
|
||||
themes_list_repo = session.query(Hugothemes).filter_by(name=THEMESLISTREPO).first()
|
||||
themes_json = json_loads(themes_list_repo.jsondump)
|
||||
if themes_list_repo.dot_gitmodules_content:
|
||||
dot_gitmodule_json = json_loads(themes_list_repo.dot_gitmodules_content)
|
||||
for theme in themes_json:
|
||||
if theme['name'] == '.gitmodules':
|
||||
new_gitmodules_sha = theme['sha']
|
||||
break
|
||||
if (not dot_gitmodule_json) or (new_gitmodules_sha != dot_gitmodule_json['sha']):
|
||||
api_call_url = "https://api.github.com/repos/"+THEMESLISTREPO+"/contents/.gitmodules"
|
||||
response = get(api_call_url)
|
||||
if response.status_code == 200:
|
||||
if themes_list_repo.dot_gitmodules_content != response.text:
|
||||
themes_list_repo.dot_gitmodules_content = response.text
|
||||
session.commit()
|
||||
print(response.status_code,update_hugo_themes_submodule_list.__name__)
|
||||
|
||||
|
||||
def get_hugo_themes_submodule_list():
|
||||
session = sessionmaker(bind=engine)()
|
||||
dot_gitmodule_json_string = session.query(Hugothemes.dot_gitmodules_content).filter_by(name=THEMESLISTREPO).first()
|
||||
dot_gitmodule_json = json_loads(dot_gitmodule_json_string[0])
|
||||
dot_gitmodule_content = b64decode(dot_gitmodule_json['content']).decode('utf-8').replace('\n\n','\n').split('\n')
|
||||
submodules = []
|
||||
for line in range(len(dot_gitmodule_content[:-1])):
|
||||
if 'submodule' in dot_gitmodule_content[line]:
|
||||
name = re.sub(r'(^\[submodule "|"\]$)','',dot_gitmodule_content[line])
|
||||
if 'path = ' in dot_gitmodule_content[line+1]:
|
||||
path = re.match(r'^.*(path = )(.*)$',dot_gitmodule_content[line+1]).group(2)
|
||||
if 'url = ' in dot_gitmodule_content[line+2]:
|
||||
url = re.match(r'^.*(url = )(.*)$',dot_gitmodule_content[line+2]).group(2)
|
||||
submodules.append((name,path,url))
|
||||
return submodules
|
||||
print(response.status_code, get_hugo_themes_list.__name__)
|
||||
|
||||
|
||||
def clean_up():
|
||||
new_name_list = set()
|
||||
submodules = get_hugo_themes_submodule_list()
|
||||
for submodule in submodules:
|
||||
submodule_name = re.sub(r'(^https://github.com/|^https://gitlab.com/|\.git$)','',submodule[2])
|
||||
new_name_list.add(submodule_name)
|
||||
themes_name_list = get_themes_name_list()
|
||||
session = sessionmaker(bind=engine)()
|
||||
old_name_list = [theme[0] for theme in session.query(Hugothemes.name).filter(Hugothemes.name!=THEMESLISTREPO).all()]
|
||||
|
||||
for name in old_name_list:
|
||||
if name not in new_name_list:
|
||||
removed_theme = session.query(Hugothemes).filter_by(name=name).first()
|
||||
hugo_themes_name_list = [theme[0] for theme in session.query(Hugothemes.name).all()]
|
||||
for theme_name in hugo_themes_name_list:
|
||||
if theme_name not in themes_name_list:
|
||||
removed_theme = session.query(Hugothemes).filter_by(name=theme_name).first()
|
||||
session.delete(removed_theme)
|
||||
|
||||
themes_json_string = session.query(Hugothemes.jsondump).filter_by(name=THEMESLISTREPO).first()
|
||||
themes_json = json_loads(themes_json_string[0])
|
||||
new_name_list = set()
|
||||
for theme in themes_json:
|
||||
if theme['git_url']:
|
||||
if 'gohugoio' not in theme['git_url']:
|
||||
split_html_url = theme['html_url'].split('/')
|
||||
new_short_name = split_html_url[3]+'/'+split_html_url[4]
|
||||
new_name_list.add(new_short_name)
|
||||
|
||||
for name in old_name_list:
|
||||
if name not in new_name_list:
|
||||
removed_theme = session.query(Hugothemes).filter_by(name=name).first()
|
||||
if removed_theme != None: session.delete(removed_theme)
|
||||
session.commit()
|
||||
|
||||
|
||||
def parse_submodules_from_gitlab():
|
||||
submodules = get_hugo_themes_submodule_list()
|
||||
temp_submodules_list = []
|
||||
for submodule in submodules:
|
||||
if 'gitlab' in submodule[2]:
|
||||
temp_submodules_list.append(submodule)
|
||||
if (len(temp_submodules_list) > 0):
|
||||
session = sessionmaker(bind=engine)()
|
||||
themes_json_string = session.query(Hugothemes.jsondump).filter_by(name=THEMESLISTREPO).first()
|
||||
themes_json = json_loads(themes_json_string[0])
|
||||
submodules_list = []
|
||||
for submodule in temp_submodules_list:
|
||||
for theme in themes_json:
|
||||
if submodule[0] == theme['name']:
|
||||
if (theme['html_url'] == None) or (theme['git_url'] == None):
|
||||
submodules_list.append((submodule[0],submodule[1],submodule[2],theme['sha']))
|
||||
if (len(submodules_list) > 0):
|
||||
for submodule in submodules_list:
|
||||
url = re.sub(r'\.git$','',submodule[2])
|
||||
theme_name = url[19:]
|
||||
theme = session.query(Hugothemes_from_gitlab).filter_by(name=theme_name).first()
|
||||
if theme == None:
|
||||
session.add(Hugothemes_from_gitlab(name=theme_name,url=url,commit_sha=submodule[3]))
|
||||
else:
|
||||
if theme.url != url: theme.url = url
|
||||
if theme.commit_sha != submodule[3]: theme.commit_sha = submodule[3]
|
||||
session.commit()
|
||||
|
||||
gitlab_themes_name_list = get_gitlab_themes_name_list()
|
||||
hugo_themes_from_gitlab_name_list = [theme[0] for theme in session.query(Hugothemes_from_gitlab.name).all()]
|
||||
for theme in hugo_themes_from_gitlab_name_list:
|
||||
if theme not in gitlab_themes_name_list:
|
||||
removed_theme = session.query(Hugothemes_from_gitlab).filter_by(name=theme).first()
|
||||
session.delete(removed_theme)
|
||||
session.commit()
|
||||
|
||||
|
||||
def parse_gitlab_hugo_themes_list():
    """Make sure every gitlab.com theme has an up-to-date Hugothemes_from_gitlab row.

    For each entry returned by get_gitlab_themes_list(), the row is keyed by
    the entry without its first 11 characters and stores the full entry as
    its url. Missing rows are inserted; existing rows only have their url
    corrected when it differs. Each change is committed as it is made.
    """
    session = sessionmaker(bind=engine)()
    for theme in get_gitlab_themes_list():
        theme_name = theme[11:]  # drop the 'gitlab.com/' prefix
        existing_theme = session.query(Hugothemes_from_gitlab).filter_by(name=theme_name).first()
        if existing_theme is None:
            session.add(Hugothemes_from_gitlab(name=theme_name, url=theme))
            session.commit()
        elif existing_theme.url != theme:
            existing_theme.url = theme
            session.commit()
|
||||
|
||||
|
||||
def parse_hugo_themes_list():
    """Make sure every THEMESLIST entry has an up-to-date Hugothemes row.

    The row is keyed by the entry without its first 11 characters (the host
    and slash) and stores the full entry as its url. Missing rows are
    inserted; existing rows only have their url corrected when it differs.
    Each change is committed as it is made.

    NOTE(review): the interleaved lines that parsed ``jsondump`` with
    ``json_loads`` are dropped here because the ``json_loads`` import is
    commented out in this revision — confirm against the committed file.
    """
    session = sessionmaker(bind=engine)()
    for theme in THEMESLIST:
        theme_name = theme[11:]  # drop 'github.com/' or 'gitlab.com/'
        existing_theme = session.query(Hugothemes).filter_by(name=theme_name).first()
        if existing_theme is None:
            session.add(Hugothemes(name=theme_name, url=theme))
            session.commit()
        elif existing_theme.url != theme:
            existing_theme.url = theme
            session.commit()
|
||||
|
||||
|
||||
@ -237,24 +180,24 @@ def get_gitlab_project_ids():
|
||||
match = re.compile(r'(Project ID: )(\d{5,})')
|
||||
for theme in themes:
|
||||
gitlab_theme = session.query(Hugothemes_from_gitlab).filter_by(name=theme).one()
|
||||
if gitlab_theme.gitlab_id == None:
|
||||
response = get(gitlab_theme.url)
|
||||
gitlab_theme.gitlab_id = match.search(response.text).group(2)
|
||||
session.commit()
|
||||
return True
|
||||
if gitlab_theme.gitlab_id is None:
|
||||
response = get(f"https://{gitlab_theme.url}")
|
||||
if response.status_code == 200:
|
||||
gitlab_theme.gitlab_id = match.search(response.text).group(2)
|
||||
session.commit()
|
||||
if response.status_code == 404:
|
||||
print(response.status_code, get_gitlab_project_ids.__name__, theme)
|
||||
print(response.status_code, get_gitlab_project_ids.__name__)
|
||||
|
||||
|
||||
def get_commit_info_for_hugo_themes():
|
||||
session = sessionmaker(bind=engine)()
|
||||
non_github_theme_list = [theme[0] for theme in session.query(Hugothemes_from_gitlab.name).all()]
|
||||
themes = set(theme[0] for theme in session.query(Hugothemes.name).filter(Hugothemes.name!=THEMESLISTREPO).all())
|
||||
for theme in non_github_theme_list:
|
||||
themes -= {theme}
|
||||
for hugo_theme in themes:
|
||||
theme_names_from_github = get_github_themes_name_list()
|
||||
for hugo_theme in theme_names_from_github:
|
||||
theme = session.query(Hugothemes).filter_by(name=hugo_theme).one()
|
||||
api_call_url = 'https://api.github.com/repos/' + theme.name + '/commits/' + theme.commit_sha
|
||||
api_call_url = f'https://api.github.com/repos/{theme.name}/commits/{theme.default_branch}'
|
||||
|
||||
if theme.ETag != None:
|
||||
if theme.ETag is not None:
|
||||
headers['If-None-Match'] = theme.ETag
|
||||
else:
|
||||
if 'If-None-Match' in headers:
|
||||
@ -264,52 +207,58 @@ def get_commit_info_for_hugo_themes():
|
||||
response = get(api_call_url)
|
||||
else:
|
||||
response = get(api_call_url, headers=headers)
|
||||
if response.status_code == 422:
|
||||
print(hugo_theme)
|
||||
quit()
|
||||
if response.status_code == 200:
|
||||
theme.ETag = response.headers['ETag'].lstrip('W/')
|
||||
result = response.json()
|
||||
theme.commit_date = result['commit']['author']['date']
|
||||
theme.commit_date_in_seconds = timegm(strptime(theme.commit_date,'%Y-%m-%dT%H:%M:%SZ'))
|
||||
theme.commit_date_in_seconds = timegm(strptime(theme.commit_date, '%Y-%m-%dT%H:%M:%SZ'))
|
||||
theme.commit_sha = result['commit']['tree']['sha']
|
||||
session.commit()
|
||||
elif response.status_code == 403:
|
||||
print(response.status_code,get_commit_info_for_hugo_themes.__name__)
|
||||
write_reports()
|
||||
print(response.status_code, get_commit_info_for_hugo_themes.__name__)
|
||||
# write_reports()
|
||||
quit()
|
||||
print(response.status_code,get_commit_info_for_hugo_themes.__name__)
|
||||
|
||||
elif response.status_code == 404:
|
||||
print(response.status_code, get_commit_info_for_hugo_themes.__name__, hugo_theme)
|
||||
print(response.status_code, get_commit_info_for_hugo_themes.__name__)
|
||||
|
||||
|
||||
def get_commit_info_for_hugo_themes_from_gitlab():
|
||||
if get_gitlab_project_ids():
|
||||
session = sessionmaker(bind=engine)()
|
||||
themes = [theme[0] for theme in session.query(Hugothemes_from_gitlab.name).all()]
|
||||
match = re.compile(r'(\.\d{3})(Z$)')
|
||||
for hugo_theme in themes:
|
||||
theme = session.query(Hugothemes_from_gitlab).filter_by(name=hugo_theme).one()
|
||||
api_call_url = 'https://gitlab.com/api/v4/projects/' + theme.gitlab_id + '/repository/commits/' + theme.commit_sha
|
||||
session = sessionmaker(bind=engine)()
|
||||
theme_names_from_gitlab = get_gitlab_themes_name_list()
|
||||
# match = re.compile(r'(\.\d{3})(Z$)')
|
||||
for hugo_theme in theme_names_from_gitlab:
|
||||
theme = session.query(Hugothemes_from_gitlab).filter_by(name=hugo_theme).one()
|
||||
api_call_url = f'https://gitlab.com/api/v4/projects/{theme.gitlab_id}/repository/commits/{theme.default_branch}'
|
||||
|
||||
response = get(api_call_url)
|
||||
if response.status_code == 200:
|
||||
result = response.json()
|
||||
# theme.commit_date = (match.sub(r'\2', result['created_at']))[0:19] + 'Z'
|
||||
theme.commit_date = result['created_at'][0:19] + 'Z'
|
||||
theme.commit_date_in_seconds = timegm(strptime(theme.commit_date, '%Y-%m-%dT%H:%M:%SZ'))
|
||||
theme.commit_sha = result['id']
|
||||
session.commit()
|
||||
elif response.status_code == 403:
|
||||
print(response.status_code, get_commit_info_for_hugo_themes_from_gitlab.__name__)
|
||||
# write_reports()
|
||||
quit()
|
||||
elif response.status_code == 404:
|
||||
print(response.status_code, get_commit_info_for_hugo_themes_from_gitlab.__name__, hugo_theme)
|
||||
print(response.status_code, get_commit_info_for_hugo_themes_from_gitlab.__name__)
|
||||
|
||||
response = get(api_call_url)
|
||||
if response.status_code == 200:
|
||||
result = response.json()
|
||||
theme.commit_date = (match.sub(r'\2',result['created_at']))[0:19] + 'Z'
|
||||
theme.commit_date_in_seconds = timegm(strptime(theme.commit_date,'%Y-%m-%dT%H:%M:%SZ'))
|
||||
session.commit()
|
||||
elif response.status_code == 403:
|
||||
print(response.status_code,get_commit_info_for_hugo_themes_from_gitlab.__name__)
|
||||
write_reports()
|
||||
quit()
|
||||
print(response.status_code,get_commit_info_for_hugo_themes_from_gitlab.__name__)
|
||||
|
||||
|
||||
def get_stargazer_count_for_hugo_themes():
|
||||
session = sessionmaker(bind=engine)()
|
||||
non_github_theme_list = [theme[0] for theme in session.query(Hugothemes_from_gitlab.name).all()]
|
||||
themes = set(theme[0] for theme in session.query(Hugothemes.name).filter(Hugothemes.name!=THEMESLISTREPO).all())
|
||||
for theme in non_github_theme_list:
|
||||
themes -= {theme}
|
||||
for hugo_theme in themes:
|
||||
theme_names_from_github = get_github_themes_name_list()
|
||||
for hugo_theme in theme_names_from_github:
|
||||
theme = session.query(Hugothemes).filter_by(name=hugo_theme).one()
|
||||
api_call_url = 'https://api.github.com/repos/' + theme.name
|
||||
|
||||
if theme.repo_ETag != None:
|
||||
if theme.repo_ETag is not None:
|
||||
headers['If-None-Match'] = theme.repo_ETag
|
||||
else:
|
||||
if 'If-None-Match' in headers:
|
||||
@ -323,44 +272,52 @@ def get_stargazer_count_for_hugo_themes():
|
||||
theme.repo_ETag = response.headers['ETag'].lstrip('W/')
|
||||
result = response.json()
|
||||
theme.stargazers_count = result['stargazers_count']
|
||||
theme.default_branch = result['default_branch']
|
||||
session.commit()
|
||||
elif response.status_code == 403:
|
||||
print(response.status_code,get_stargazer_count_for_hugo_themes.__name__)
|
||||
write_reports()
|
||||
print(response.status_code, get_stargazer_count_for_hugo_themes.__name__)
|
||||
# write_reports()
|
||||
quit()
|
||||
print(response.status_code,get_stargazer_count_for_hugo_themes.__name__)
|
||||
elif response.status_code == 404:
|
||||
print(response.status_code, get_stargazer_count_for_hugo_themes.__name__, hugo_theme)
|
||||
print(response.status_code, get_stargazer_count_for_hugo_themes.__name__)
|
||||
|
||||
|
||||
def get_stargazer_count_for_hugo_themes_from_gitlab():
|
||||
if get_gitlab_project_ids():
|
||||
session = sessionmaker(bind=engine)()
|
||||
themes = [(theme,gitlab_id) for theme,gitlab_id in session.query(Hugothemes_from_gitlab.name,Hugothemes_from_gitlab.gitlab_id).all()]
|
||||
for hugo_theme in themes:
|
||||
theme = session.query(Hugothemes_from_gitlab).filter_by(name=hugo_theme[0]).one()
|
||||
api_call_url = 'https://gitlab.com/api/v4/projects/' + hugo_theme[1]
|
||||
response = get(api_call_url)
|
||||
if response.status_code == 200:
|
||||
result = response.json()
|
||||
if theme.star_count != result['star_count']:
|
||||
theme.star_count = result['star_count']
|
||||
session.commit()
|
||||
elif response.status_code == 403:
|
||||
print(response.status_code,get_stargazer_count_for_hugo_themes_from_gitlab.__name__)
|
||||
write_reports()
|
||||
quit()
|
||||
print(response.status_code,get_stargazer_count_for_hugo_themes_from_gitlab.__name__)
|
||||
session = sessionmaker(bind=engine)()
|
||||
theme_names_from_gitlab = get_gitlab_themes_name_list()
|
||||
for hugo_theme in theme_names_from_gitlab:
|
||||
theme = session.query(Hugothemes_from_gitlab).filter_by(name=hugo_theme).one()
|
||||
api_call_url = f'https://gitlab.com/api/v4/projects/{theme.gitlab_id}'
|
||||
response = get(api_call_url)
|
||||
if response.status_code == 200:
|
||||
result = response.json()
|
||||
if theme.star_count != result['star_count']:
|
||||
theme.star_count = result['star_count']
|
||||
if theme.default_branch != result['default_branch']:
|
||||
theme.default_branch = result['default_branch']
|
||||
session.commit()
|
||||
elif response.status_code == 403:
|
||||
print(response.status_code, get_stargazer_count_for_hugo_themes_from_gitlab.__name__)
|
||||
# write_reports()
|
||||
quit()
|
||||
elif response.status_code == 404:
|
||||
print(response.status_code, get_stargazer_count_for_hugo_themes_from_gitlab.__name__, hugo_theme)
|
||||
print(response.status_code, get_stargazer_count_for_hugo_themes_from_gitlab.__name__)
|
||||
|
||||
|
||||
def get_theme_dot_toml_for_each_hugo_themes():
|
||||
session = sessionmaker(bind=engine)()
|
||||
non_github_theme_list = [theme[0] for theme in session.query(Hugothemes_from_gitlab.name).all()]
|
||||
themes = set(theme[0] for theme in session.query(Hugothemes.name).filter(Hugothemes.name!=THEMESLISTREPO).all())
|
||||
for theme in non_github_theme_list: themes -= {theme}
|
||||
for hugo_theme in themes:
|
||||
theme_names_from_github = get_github_themes_name_list()
|
||||
for hugo_theme in theme_names_from_github:
|
||||
theme = session.query(Hugothemes).filter_by(name=hugo_theme).one()
|
||||
api_call_url = "https://api.github.com/repos/"+theme.name+"/contents/theme.toml"
|
||||
if theme.name == 'gcushen/hugo-academic':
|
||||
theme_toml = 'wowchemy/theme.toml'
|
||||
else:
|
||||
theme_toml = 'theme.toml'
|
||||
api_call_url = f"https://api.github.com/repos/{theme.name}/contents/{theme_toml}"
|
||||
|
||||
if theme.themes_toml_ETag != None:
|
||||
if theme.themes_toml_ETag is not None:
|
||||
headers['If-None-Match'] = theme.themes_toml_ETag
|
||||
else:
|
||||
if 'If-None-Match' in headers:
|
||||
@ -376,65 +333,69 @@ def get_theme_dot_toml_for_each_hugo_themes():
|
||||
theme.themes_toml_content = result['content']
|
||||
session.commit()
|
||||
elif response.status_code == 403:
|
||||
print(response.status_code,get_theme_dot_toml_for_each_hugo_themes.__name__)
|
||||
write_reports()
|
||||
print(response.status_code, get_theme_dot_toml_for_each_hugo_themes.__name__)
|
||||
# write_reports()
|
||||
quit()
|
||||
print(response.status_code,get_theme_dot_toml_for_each_hugo_themes.__name__)
|
||||
elif response.status_code == 404:
|
||||
print(response.status_code, get_theme_dot_toml_for_each_hugo_themes.__name__, hugo_theme)
|
||||
print(response.status_code, get_theme_dot_toml_for_each_hugo_themes.__name__)
|
||||
|
||||
|
||||
def get_theme_dot_toml_for_each_hugo_themes_from_gitlab():
|
||||
if get_gitlab_project_ids():
|
||||
session = sessionmaker(bind=engine)()
|
||||
themes = [(theme,gitlab_id) for theme,gitlab_id in session.query(Hugothemes_from_gitlab.name,Hugothemes_from_gitlab.gitlab_id).all()]
|
||||
for hugo_theme in themes:
|
||||
theme = session.query(Hugothemes_from_gitlab).filter_by(name=hugo_theme[0]).one()
|
||||
api_call_url = 'https://gitlab.com/api/v4/projects/' + hugo_theme[1] + '/repository/files/theme.toml?ref=master'
|
||||
response = get(api_call_url)
|
||||
if response.status_code == 200:
|
||||
result = response.json()
|
||||
theme.themes_toml_content = result['content']
|
||||
session.commit()
|
||||
elif response.status_code == 403:
|
||||
print(response.status_code,get_theme_dot_toml_for_each_hugo_themes_from_gitlab.__name__)
|
||||
write_reports()
|
||||
quit()
|
||||
print(response.status_code,get_theme_dot_toml_for_each_hugo_themes_from_gitlab.__name__)
|
||||
session = sessionmaker(bind=engine)()
|
||||
theme_names_from_gitlab = get_gitlab_themes_name_list()
|
||||
for hugo_theme in theme_names_from_gitlab:
|
||||
theme = session.query(Hugothemes_from_gitlab).filter_by(name=hugo_theme).one()
|
||||
api_call_url = f'https://gitlab.com/api/v4/projects/{theme.gitlab_id}/repository/files/theme.toml?ref={theme.default_branch}'
|
||||
response = get(api_call_url)
|
||||
if response.status_code == 200:
|
||||
result = response.json()
|
||||
theme.themes_toml_content = result['content']
|
||||
session.commit()
|
||||
elif response.status_code == 403:
|
||||
print(response.status_code, get_theme_dot_toml_for_each_hugo_themes_from_gitlab.__name__)
|
||||
# write_reports()
|
||||
quit()
|
||||
elif response.status_code == 404:
|
||||
print(response.status_code, get_theme_dot_toml_for_each_hugo_themes_from_gitlab.__name__, hugo_theme)
|
||||
print(response.status_code, get_theme_dot_toml_for_each_hugo_themes_from_gitlab.__name__)
|
||||
|
||||
|
||||
def coalesce_themes():
|
||||
if get_gitlab_project_ids():
|
||||
session = sessionmaker(bind=engine)()
|
||||
themes = [theme[0] for theme in session.query(Hugothemes_from_gitlab.name).all()]
|
||||
for hugo_theme in themes:
|
||||
htfgitlab = session.query(Hugothemes_from_gitlab).filter_by(name=hugo_theme).one()
|
||||
theme = session.query(Hugothemes).filter_by(name=hugo_theme).first()
|
||||
if theme == None:
|
||||
session.add(Hugothemes(name=hugo_theme,url=htfgitlab.url,commit_sha=htfgitlab.commit_sha,
|
||||
commit_date=htfgitlab.commit_date,commit_date_in_seconds=htfgitlab.commit_date_in_seconds,
|
||||
stargazers_count=htfgitlab.star_count,themes_toml_content=htfgitlab.themes_toml_content))
|
||||
else:
|
||||
if theme.url != htfgitlab.url: theme.url = htfgitlab.url
|
||||
if theme.commit_sha != htfgitlab.commit_sha: theme.commit_sha = htfgitlab.commit_sha
|
||||
if theme.commit_date != htfgitlab.commit_date: theme.commit_date = htfgitlab.commit_date
|
||||
if theme.commit_date_in_seconds != htfgitlab.commit_date_in_seconds:
|
||||
theme.commit_date_in_seconds = htfgitlab.commit_date_in_seconds
|
||||
if theme.stargazers_count != htfgitlab.star_count: theme.stargazers_count = htfgitlab.star_count
|
||||
theme.themes_toml_content = htfgitlab.themes_toml_content
|
||||
session.commit()
|
||||
session = sessionmaker(bind=engine)()
|
||||
theme_names_from_gitlab = get_gitlab_themes_name_list()
|
||||
for hugo_theme in theme_names_from_gitlab:
|
||||
htfgitlab = session.query(Hugothemes_from_gitlab).filter_by(name=hugo_theme).one()
|
||||
theme = session.query(Hugothemes).filter_by(name=hugo_theme).first()
|
||||
if theme is None:
|
||||
session.add(Hugothemes(
|
||||
name=hugo_theme, url=htfgitlab.url, commit_sha=htfgitlab.commit_sha,
|
||||
commit_date=htfgitlab.commit_date, commit_date_in_seconds=htfgitlab.commit_date_in_seconds,
|
||||
stargazers_count=htfgitlab.star_count, themes_toml_content=htfgitlab.themes_toml_content
|
||||
))
|
||||
else:
|
||||
if theme.url != htfgitlab.url: theme.url = htfgitlab.url
|
||||
if theme.commit_sha != htfgitlab.commit_sha: theme.commit_sha = htfgitlab.commit_sha
|
||||
if theme.commit_date != htfgitlab.commit_date: theme.commit_date = htfgitlab.commit_date
|
||||
if theme.commit_date_in_seconds != htfgitlab.commit_date_in_seconds:
|
||||
theme.commit_date_in_seconds = htfgitlab.commit_date_in_seconds
|
||||
if theme.stargazers_count != htfgitlab.star_count: theme.stargazers_count = htfgitlab.star_count
|
||||
theme.themes_toml_content = htfgitlab.themes_toml_content
|
||||
session.commit()
|
||||
|
||||
|
||||
def update_tags_list_for_each_hugo_themes():
|
||||
session = sessionmaker(bind=engine)()
|
||||
themes = [theme[0] for theme in session.query(Hugothemes.name).filter(Hugothemes.name!=THEMESLISTREPO).all()]
|
||||
themes = [theme[0] for theme in session.query(Hugothemes.name).filter(Hugothemes.name != THEMESLISTREPO).all()]
|
||||
match = re.compile(r'\s(\d+\.\d+\.\d+)\s')
|
||||
for hugo_theme in themes:
|
||||
theme = session.query(Hugothemes).filter_by(name=hugo_theme).one()
|
||||
if theme.themes_toml_content != None:
|
||||
if theme.themes_toml_content is not None:
|
||||
content = b64decode(theme.themes_toml_content).decode('utf-8')
|
||||
# put quotes around any unquoted double-dotted version numbers
|
||||
# (and add a newline afterwards)
|
||||
# because python toml libraries will error out on those
|
||||
theme_toml = toml.loads(match.sub(r'"\1"\n',content))
|
||||
theme_toml = toml.loads(match.sub(r'"\1"\n', content))
|
||||
if 'tags' in theme_toml:
|
||||
if len(theme_toml['tags']) > 0:
|
||||
theme_tags = [tag.lower() for tag in theme_toml['tags'] if len(tag) > 0]
|
||||
@ -442,26 +403,26 @@ def update_tags_list_for_each_hugo_themes():
|
||||
if theme.num_tags > 0:
|
||||
if theme.tags_list != str(theme_tags): theme.tags_list = str(theme_tags)
|
||||
else:
|
||||
if theme.tags_list != None: theme.tags_list = None
|
||||
if theme.tags_list is not None: theme.tags_list = None
|
||||
else:
|
||||
if theme.tags_list != None: theme.tags_list = None
|
||||
if theme.tags_list is not None: theme.tags_list = None
|
||||
if theme.num_tags != 0: theme.num_tags = 0
|
||||
else:
|
||||
if theme.tags_list != None: theme.tags_list = None
|
||||
if theme.tags_list is not None: theme.tags_list = None
|
||||
if theme.num_tags != 0: theme.num_tags = 0
|
||||
else:
|
||||
if theme.tags_list != None: theme.tags_list = None
|
||||
if theme.tags_list is not None: theme.tags_list = None
|
||||
if theme.num_tags != 0: theme.num_tags = 0
|
||||
session.commit()
|
||||
|
||||
|
||||
def update_tag_table():
|
||||
session = sessionmaker(bind=engine)()
|
||||
themes = [(theme,tags_list) for theme,tags_list in session.query(Hugothemes.name,Hugothemes.tags_list)
|
||||
.filter(Hugothemes.name!=THEMESLISTREPO).all()]
|
||||
themes = [(theme, tags_list) for theme, tags_list in session.query(
|
||||
Hugothemes.name, Hugothemes.tags_list).filter(Hugothemes.name != THEMESLISTREPO).all()]
|
||||
tags_list = set()
|
||||
for theme in themes:
|
||||
if theme[1] != None:
|
||||
if theme[1] is not None:
|
||||
tags = literal_eval(theme[1])
|
||||
for tag in tags:
|
||||
if len(tag) > 0:
|
||||
@ -470,15 +431,15 @@ def update_tag_table():
|
||||
for hugo_tag in tags_list:
|
||||
theme_list = []
|
||||
for theme in themes:
|
||||
if theme[1] != None:
|
||||
if theme[1] is not None:
|
||||
tags = literal_eval(theme[1])
|
||||
if hugo_tag in tags:
|
||||
theme_list.append(theme[0])
|
||||
tag = session.query(Tags).filter_by(tag=hugo_tag).first()
|
||||
if tag == None:
|
||||
session.add(Tags(tag=hugo_tag,theme_list=str(theme_list),num_themes=len(theme_list)))
|
||||
if tag is None:
|
||||
session.add(Tags(tag=hugo_tag, theme_list=str(theme_list), num_themes=len(theme_list)))
|
||||
else:
|
||||
theme_list,num_themes = str(theme_list),len(theme_list)
|
||||
theme_list, num_themes = str(theme_list), len(theme_list)
|
||||
if tag.theme_list != theme_list: tag.theme_list = theme_list
|
||||
if tag.num_themes != num_themes: tag.num_themes = num_themes
|
||||
session.commit()
|
||||
@ -506,71 +467,72 @@ def make_table(themes_info):
|
||||
table = "\t<div class='container'>\n\t\t<table class='table monospace'>\n\t\t\t<thead><tr><th scope='col'>" + themes_info[1] + " (tag) " + themes_info[2] + "</th><th scope='col'>Date</th></tr></thead>\n\t\t\t<tbody>\n"
|
||||
for theme in themes_info[0]:
|
||||
name = theme[0].split('/')[1]
|
||||
row = "\t\t\t\t<tr><td scope='row'>"+"<a target='_blank' href='"+theme[4]+"'>"+name+"</a>""</td>"
|
||||
row += "<td nowrap>"+theme[2][:10]+"</td>"
|
||||
row += "<td align='right' nowrap style='padding-left:1em;'>"+str(theme[3])+'★'+"</td>"
|
||||
row += "<td align='right' style='padding-left:1em;'>"+theme[1][:6]+"</td></tr>\n"
|
||||
row = "\t\t\t\t<tr><td scope='row'>" + "<a target='_blank' href='" + theme[4] + "'>" + name + "</a>""</td>"
|
||||
row += "<td nowrap>" + theme[2][:10] + "</td>"
|
||||
row += "<td align='right' nowrap style='padding-left:1em;'>" + str(theme[3]) + '★' + "</td>"
|
||||
row += "<td align='right' style='padding-left:1em;'>" + theme[1][:6] + "</td></tr>\n"
|
||||
table += row
|
||||
table += "\t\t\t</tbody>\n\t\t</table>\n\t</div>\n"
|
||||
table += "\t\t\t</tbody>\n\t\t</table>\n\t</div>\n"
|
||||
return table
|
||||
|
||||
|
||||
def make_section(section_info):
    """Build the HTML for one report section.

    section_info is indexed as (label, rows ordered by date, rows ordered by
    stars, number of themes).  Every section gets nav buttons and a table for
    the by-date ordering; the by-stars buttons and table are appended only
    when the section holds more than ten themes.
    """
    theme_count = section_info[3]
    label = section_info[0]

    # The by-date view is always present.
    pieces = [
        make_nav_buttons((label, 'by-date', theme_count)),
        make_table((section_info[1], label, 'by-date')),
    ]

    # Small sections skip the second ordering.
    if theme_count > 10:
        pieces.append(make_nav_buttons((label, 'by-stars', theme_count)))
        pieces.append(make_table((section_info[2], label, 'by-stars')))

    section = pieces[0]
    for piece in pieces[1:]:
        section += piece
    return section
|
||||
|
||||
|
||||
def write_reports():
    """Render the HTML themes report and write it to disk.

    Reads every theme except the THEMESLISTREPO entry, ordered once by most
    recent commit and once by stargazer count, plus every tag that has more
    than two themes (most-used tags first).  The page consists of an 'all'
    section, the tag buttons, and one section per tag, and is written to
    'hugo-themes-report/hugo-themes-report.html'.
    """
    session = sessionmaker(bind=engine)()
    try:
        columns = (
            Hugothemes.name,
            Hugothemes.commit_sha,
            Hugothemes.commit_date,
            Hugothemes.stargazers_count,
            Hugothemes.url,
        )
        base_query = session.query(*columns).filter(Hugothemes.name != THEMESLISTREPO)
        themes_bydate_list = list(base_query.order_by(Hugothemes.commit_date_in_seconds.desc()))
        themes_bystars_list = list(base_query.order_by(Hugothemes.stargazers_count.desc()))
        tag_rows = list(
            session.query(Tags.tag, Tags.theme_list, Tags.num_themes)
            .filter(Tags.num_themes > 2)
            .order_by(Tags.num_themes.desc())
        )
    finally:
        # All rows are materialized above, so the session can be released
        # before the page is assembled.
        session.close()

    themes = [theme[0] for theme in themes_bystars_list]
    # The synthetic 'all' entry goes first; make_buttons receives it together
    # with the real tags.
    tags_list = [('all', str(themes), len(themes))]
    tags_list += tag_rows

    parts = [
        "<!DOCTYPE html>\n<html lang='en'>\n",
        "\t<head>\n\t\t<title>Hugo Themes Report</title>\n\t\t<meta charset='utf-8'>",
        "\n\t\t<meta name='viewport' content='width=device-width, initial-scale=1'>\n",
        "\t\t<link rel='stylesheet' href='https://maxcdn.bootstrapcdn.com/bootstrap/4.0.0/css/bootstrap.min.css' ",
        "integrity='sha384-Gn5384xqQ1aoWXA+058RXPxPg6fy4IWvTNh0E263XmFcJlSAwiGgFAW/dAiS6JXm' crossorigin='anonymous'>\n\t</head>\n",
        "\t<body>\n",
        make_section(('all', themes_bydate_list, themes_bystars_list, len(themes_bydate_list))),
        make_buttons(tags_list),
    ]

    for tag in tags_list[1:]:
        # theme_list is stored as the str() of a list of theme names; a set
        # makes the membership tests below constant-time.
        tag_themes = set(literal_eval(tag[1]))
        bydate_list = [theme for theme in themes_bydate_list if theme[0] in tag_themes]
        bystars_list = [theme for theme in themes_bystars_list if theme[0] in tag_themes]
        parts.append(make_section((tag[0], bydate_list, bystars_list, tag[2])))

    parts.append("\t</body>")
    parts.append("\n</html>")
    reportpage = "".join(parts)

    # The page declares charset utf-8 and contains non-ASCII characters, so
    # the encoding must not be left to the platform default.  The context
    # manager closes the file even if the write fails.
    with open('hugo-themes-report/hugo-themes-report.html', 'w', encoding='utf-8') as report_file:
        report_file.write(reportpage)
|
||||
|
||||
|
||||
# Script entry point: run the report pipeline in order.
# NOTE(review): this block was reconstructed from an indentation-stripped
# diff; the nesting of the steps under the size guard is presumed -- confirm
# against the real file.
if __name__ == "__main__":
    get_hugo_themes_list()
    # Presumably THEMESLIST is filled by get_hugo_themes_list(); the remaining
    # steps run only when it holds more than 300 entries -- TODO confirm.
    if len(THEMESLIST) > 300:
        clean_up()
        parse_hugo_themes_list()
        parse_gitlab_hugo_themes_list()
        get_gitlab_project_ids()
        get_stargazer_count_for_hugo_themes()
        get_stargazer_count_for_hugo_themes_from_gitlab()
        get_commit_info_for_hugo_themes()
        get_commit_info_for_hugo_themes_from_gitlab()
        get_theme_dot_toml_for_each_hugo_themes()
        get_theme_dot_toml_for_each_hugo_themes_from_gitlab()
        coalesce_themes()
        # Tag data is derived from the theme rows, then the report is written
        # last.
        update_tags_list_for_each_hugo_themes()
        update_tag_table()
        write_reports()
|
||||
|
Loading…
Reference in New Issue
Block a user