Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Collect pandoc urls from github api #372

Open
wants to merge 6 commits into
base: master
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 2 additions & 1 deletion .github/workflows/ci.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -45,7 +45,7 @@ jobs:
run: poetry install
if: steps.cached-poetry-dependencies.outputs.cache-hit != 'true'
- name: Download pandoc
run: poetry run python setup_binary.py download_pandoc
run: GITHUB_TOKEN=${{ secrets.GITHUB_TOKEN }} poetry run python setup_binary.py download_pandoc
- name: run tests
run: poetry run python tests.py

Expand Down Expand Up @@ -89,6 +89,7 @@ jobs:
- name: Build binary Archive
uses: pypa/[email protected]
env:
GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
CIBW_BEFORE_ALL: "python3 -m pip install --break-system-packages setuptools && mv setup_binary.py setup.py && python3 setup.py download_pandoc"
CIBW_BUILD: cp39-* # Build any 1 python version as this wheel is not version dependent
# We skip some variants because:
Expand Down
2 changes: 1 addition & 1 deletion pypandoc/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -21,7 +21,7 @@
__author_email__ = "[email protected]"
__maintainer__ = u'Jessica Tegner'
__url__ = 'https://github.com/JessicaTegner/pypandoc'
__version__ = '1.14'
__version__ = '1.15'
__license__ = 'MIT'
__description__ = "Thin wrapper for pandoc."
__python_requires__ = ">=3.7"
Expand Down
55 changes: 33 additions & 22 deletions pypandoc/pandoc_download.py
Original file line number Diff line number Diff line change
@@ -1,6 +1,5 @@
# -*- coding: utf-8 -*-

import logging
import json
import os
import os.path
import platform
Expand All @@ -13,9 +12,11 @@

import urllib
try:
from urllib.request import urlopen
from urllib.request import urlopen, Request
from urllib.parse import urlparse
except ImportError:
from urllib import urlopen
from urllib2 import urlopen, Request
from urlparse import urlparse

from .handler import logger, _check_log_handler

Expand All @@ -42,36 +43,46 @@ def _get_pandoc_urls(version="latest"):
:return: str version: actual pandoc version. (e.g. "latest" will be resolved to the actual one)
"""
# url to pandoc download page
url = "https://github.com/jgm/pandoc/releases/" + \
("tag/" if version != "latest" else "") + version
url = "https://api.github.com/repos/jgm/pandoc/releases/" + \
("tags/" if version != "latest" else "") + version
github_token = os.getenv("GITHUB_TOKEN")
if github_token:
headers = {
"Authorization": f"Bearer {github_token}"
}
src = Request(url, headers=headers)
else:
src = url
# try to open the url
try:
response = urlopen(url)
version_url_frags = response.url.split("/")
version = version_url_frags[-1]
response = urlopen(src)
except urllib.error.HTTPError as e:
raise RuntimeError("Invalid pandoc version {}.".format(version))
return
# read the HTML content
response = urlopen(f"https://github.com/jgm/pandoc/releases/expanded_assets/{version}")
content = response.read()
# read json response
data = json.loads(response.read())
# regex for the binaries
uname = platform.uname()[4]
processor_architecture = "arm" if uname.startswith("arm") or uname.startswith("aarch") else "amd"
regex = re.compile(fr"/jgm/pandoc/releases/download/.*(?:{processor_architecture}|x86|mac).*\.(?:msi|deb|pkg)")
# a list of urls to the binaries
pandoc_urls_list = regex.findall(content.decode("utf-8"))
processor_architecture = (
"arm" if uname.startswith("arm") or uname.startswith("aarch") else "amd"
)
regex = re.compile(
rf"/jgm/pandoc/releases/download/.*(?:{processor_architecture}|x86|mac)"
r".*\.(?:msi|deb|pkg)"
)
# actual pandoc version
version = pandoc_urls_list[0].split('/')[5]
version = data["tag_name"]
# dict that lookup the platform from binary extension
ext2platform = {
'msi': 'win32',
'deb': 'linux',
'pkg': 'darwin'
}
# parse pandoc_urls from list to dict
# py26 don't like dict comprehension. Use this one instead when py26 support is dropped
pandoc_urls = {ext2platform[url_frag[-3:]]: (f"https://github.com{url_frag}") for url_frag in pandoc_urls_list}
}
# collect pandoc urls from json content
pandoc_urls = dict()
for asset in data["assets"]:
download_url = asset["browser_download_url"]
if regex.match(urlparse(download_url).path):
pandoc_urls[ext2platform.get(asset["name"][-3:])] = download_url
return pandoc_urls, version


Expand Down
2 changes: 1 addition & 1 deletion pyproject.toml
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
[tool.poetry]
name = "pypandoc"
version = "1.14"
version = "1.15"
description = "Thin wrapper for pandoc"
authors = ["JessicaTegner <jessica.tegneroutlook.com>"]
license = "MIT"
Expand Down