diff --git a/.github/workflows/release.yaml b/.github/workflows/release.yaml index f3e7dff..84f6233 100644 --- a/.github/workflows/release.yaml +++ b/.github/workflows/release.yaml @@ -28,6 +28,7 @@ jobs: zenodo_json: .zenodo.json archive: ${{ env.archive }} token: ${{ secrets.ZENODO_TOKEN }} + doi: 10.5281/zenodo.6326822 - name: View Outputs env: @@ -50,4 +51,3 @@ jobs: echo "latest html ${latest_html}" echo "record ${record}" echo "record html ${record_html}" - diff --git a/README.md b/README.md index 59ea590..8862dc4 100644 --- a/README.md +++ b/README.md @@ -37,10 +37,24 @@ I think this is kind of silly, but that's just me. ## Usage +When looking at artifacts in Zenodo you'll see a versions card like the image below. This artifact has +only one version, 0.0.15. By default, this is the behavior of this action - to create brand new artifacts +with only one version. + +If, however, you'd like to make new versions you can specify the DOI that represents *all* +versions. In this image you would specify `10.5281/zenodo.6326822`. This action will then +create new versions tied to this DOI. + +![Zenodo card for versions. '0.0.15' is the only version and has a DOI of 10.5281/zenodo.6326823. The footer of the card has a 'cite all versions' note with DOI 10.5281/zenodo.6326822](img/zenodo_versions.png) + ### GitHub Action -After you complete the steps above to create the metadata file, you might create a release -action as follows: +After you complete the steps above to create the metadata file, you have two options. + +#### Existing DOI + +If you have an existing DOI of the **all versions** type (meaning we can update it), you should provide it to the action. 
+The example below shows running a release workflow and providing an archive to update to a new version (**released under the same DOI**): ```yaml name: Zenodo Release @@ -68,13 +82,73 @@ jobs: with: token: ${{ secrets.ZENODO_TOKEN }} version: ${{ github.event.release.tag_name }} - zenodo_json: .zenodo.json + zenodo_json: .zenodo.json # optional archive: ${{ env.archive }} + + # Optional DOI for all versions. Leaving this blank (the default) will create + # a new DOI on every release. Using a DOI that represents all versions will + # create a new version for this existing DOI. + # + # Newer versions have their own DOIs, but they're also linked to this DOI + # as a different version. When using this, use the DOI for all versions. + doi: '10.5281/zenodo.6326822' ``` -Notice how we are choosing to use the .tar.gz (you could use the zip too at `${{ github.event.release.zipball_url }}`) -and using the default zenodo.json that is obtained from the checked out repository. +Notice how we are choosing to use the .tar.gz (you could use the zip too at `${{ github.event.release.zipball_url }}`). +Note that the "zenodo.json" is optional only if you've already created the record with some metadata. If you provide it, +it will be used to update metadata found with the previous upload. If you don't provide it, the previous upload will +only be updated for the date and version. Note that we are considering adding an ability to upload from new authors found +in the commit history, but this is not implemented yet. + +#### New DOI + +If you want each release to get a fresh DOI (with no shared DOI for all versions), just remove the `doi` variable. Note +that for this case, the .zenodo.json is required as there isn't a previous record to get it from. 
+ +```yaml +name: Zenodo Release + +on: + release: + types: [published] + +jobs: + deploy: + runs-on: ubuntu-20.04 + + steps: + - uses: actions/checkout@v3 + - name: download archive to runner + env: + tarball: ${{ github.event.release.tarball_url }} + run: | + name=$(basename ${tarball}) + curl -L $tarball > $name + echo "archive=${name}" >> $GITHUB_ENV + + - name: Run Zenodo Deploy + uses: rseng/zenodo-release@main + with: + token: ${{ secrets.ZENODO_TOKEN }} + version: ${{ github.event.release.tag_name }} + zenodo_json: .zenodo.json # required + archive: ${{ env.archive }} +``` + +#### Archives + +For both of the above, instead of an exact archive path you can also provide a pattern that is passed to Python's `glob.glob`. For example: + +```yaml + with: + archive: "files/*.tar.gz" +``` + +Note that we will be testing support for more than one path or pattern soon. We also grab the version as the release tag. We are also running on the publication of a release. + +#### Outputs + If you want to see or do something with the outputs, add an `id` to the deploy step and do: ```yaml @@ -119,7 +193,7 @@ the following: ```bash export ZENODO_TOKEN=xxxxxxxxxxxxxxxxxxxx - # archive # identifier # version -$ python scripts/deploy.py upload 0.0.0.tar.gz 6326700 --version 0.0.0 + # archive # multi-version DOI # new version +$ python scripts/deploy.py upload 0.0.0.tar.gz --doi 10.5281/zenodo.6326822 --version 0.0.0 ``` diff --git a/action.yml b/action.yml index e275d34..1a266e7 100644 --- a/action.yml +++ b/action.yml @@ -12,6 +12,8 @@ inputs: required: true zenodo_json: description: Path to zenodo.json to upload with metadata (must exist) + doi: + description: The DOI to create a new version from outputs: badge: @@ -54,5 +56,16 @@ runs: version: ${{ inputs.version }} ACTION_PATH: ${{ github.action_path }} ZENODO_TOKEN: ${{ inputs.token }} - run: python ${{ github.action_path }}/scripts/deploy.py upload ${archive} --zenodo-json ${zenodo_json} --version ${version} + doi: ${{ inputs.doi }} + run: 
| + command="python ${{ github.action_path }}/scripts/deploy.py upload ${archive} --version ${version}" + if [[ "${doi}" != "" ]]; then + command="$command --doi ${doi}" + fi + if [[ "${zenodo_json}" != "" ]]; then + command="$command --zenodo-json ${zenodo_json}" + fi + printf "$command\n" + $command + shell: bash diff --git a/img/zenodo_versions.png b/img/zenodo_versions.png new file mode 100644 index 0000000..dacef5f Binary files /dev/null and b/img/zenodo_versions.png differ diff --git a/scripts/deploy.py b/scripts/deploy.py index d83a180..1eb5894 100644 --- a/scripts/deploy.py +++ b/scripts/deploy.py @@ -10,6 +10,7 @@ import os import json import sys +from glob import glob from datetime import datetime import requests @@ -27,81 +28,231 @@ def read_json(filename): ZENODO_TOKEN = os.environ.get("ZENODO_TOKEN") -ZENODO_HOST = "zenodo.org" if not ZENODO_TOKEN: sys.exit("A ZENODO_TOKEN is required to be exported in the environment!") -def upload_archive(archive, zenodo_json, version): +class Zenodo: """ - Upload an archive to zenodo + Zenodo client to handle shared API calls. """ - archive = os.path.abspath(archive) - if not os.path.exists(archive): - sys.exit("Archive %s does not exist." 
% archive) - headers = {"Accept": "application/json"} - params = {"access_token": ZENODO_TOKEN} + def __init__(self, sandbox=False): + self.headers = {"Accept": "application/json"} + self.params = {"access_token": ZENODO_TOKEN} + self.set_host(sandbox) - # Create an empty upload - response = requests.post( - "https://zenodo.org/api/deposit/depositions", - params=params, - json={}, - headers=headers, - ) - if response.status_code not in [200, 201]: - sys.exit( - "Trouble requesting new upload: %s, %s" - % (response.status_code, response.json()) + def set_host(self, sandbox=False): + """ + Given a preference for sandbox (or not) set the API host + """ + self.host = "zenodo.org" + if sandbox: + self.host = "sandbox.zenodo.org" + + def get(self, url): + """ + Wrapper to get to handle adding host and adding params or headers + """ + if not url.startswith("http"): + url = "https://%s%s" % (self.host, url) + return requests.get(url, params=self.params, headers=self.headers) + + def post(self, url): + """ + Wrapper to post to handle adding host and adding params or headers + """ + if not url.startswith("http"): + url = "https://%s%s" % (self.host, url) + return requests.post(url, params=self.params, headers=self.headers) + + def get_depositions(self): + """ + Get all current depositions. + """ + response = self.get("/api/deposit/depositions") + if response.status_code not in [200, 201]: + sys.exit( + "Cannot query depositions: %s, %s" + % (response.status_code, response.json()) + ) + return response.json() + + def find_deposit(self, doi): + """ + Given a doi, find the deposit, return None if no match + """ + deposits = self.get_depositions() + + # Look for the matching DOI + target_deposit = None + for deposit in deposits: + if "doi" not in deposit: + continue + print("looking at deposit %s" % deposit["doi"]) + if deposit["conceptdoi"] == doi: + print("Found deposit %s! 
🎉️" % doi) + target_deposit = deposit + break + + return target_deposit + + def new_doi(self): + """ + Create a new (empty) upload for a DOI + """ + response = requests.post( + "https://zenodo.org/api/deposit/depositions", + params=params, + json={}, + headers=headers, ) + if response.status_code not in [200, 201]: + sys.exit( + "Trouble requesting new upload: %s, %s" + % (response.status_code, response.json()) + ) + return response.json() + + def update_doi(self, doi): + """ + Given an existing DOI, update with a new archives (or pattern of files). + """ + target_deposit = self.find_deposit(doi) + if not target_deposit: + sys.exit( + "Cannot find deposit with doi: '%s'. Are you currently editing it?" + % doi + ) + + # If we have an unpublished draft - continue working onit + if not target_deposit["submitted"]: + draft = target_deposit + else: + # found the existing deposit - so let's make a new version. + response = self.post( + "%s/actions/newversion" % target_deposit["links"]["self"] + ) + if response.status_code not in [200, 201]: + sys.exit( + "Cannot create a new version for doi '%s'. %s" + % (doi, response.json()) + ) + draft = response.json() + + # this is actually the next draft. cannot edit the existing doi above + response = self.get(draft["links"]["latest_draft"]) + if response.status_code not in [200, 201]: + sys.exit("Cannot create a draft for doi '%s'. %s" % (doi, response.json())) + new_version = response.json() + + # this draft is based off of version N-1, so let's remove N-1's artifacts to make room + # for version N. + for file in new_version.get("files", []): + response = requests.delete( + file["links"]["self"], params=self.params, headers=self.headers + ) + if response.status_code not in [200, 204]: + print( + "could not delete file %s: %s" % (file["filename"], response.json()) + ) + return new_version + + def upload_archive(self, upload, archive): + """ + Given an upload response and archive, upload the new file! 
+ """ + # Using requests files indicates multipart/form-data + # Here we are uploading the new release file + url = "https://zenodo.org/api/deposit/depositions/%s/files" % upload["id"] + bucket_url = upload["links"]["bucket"] + + with open(archive, "rb") as fp: + response = requests.put( + "%s/%s" % (bucket_url, os.path.basename(archive)), + data=fp, + params=self.params, + ) + if response.status_code != 200: + sys.exit("Trouble uploading artifact %s to bucket" % archive) + + def publish(self, data): + """ + Given a data response from a new metadata upload, publish it. + """ + publish_url = data["links"]["publish"] + r = requests.post(publish_url, params=self.params) + if r.status_code not in [200, 201, 202]: + sys.exit("Issue publishing record: %s, %s" % (r.status_code, r.json())) + + published = r.json() + print("::group::Record") + print(json.dumps(published, indent=4)) + print("::endgroup::") + for k, v in published["links"].items(): + print("::set-output name=%s::%s" % (k, v)) - upload = response.json() + def upload_metadata(self, upload, zenodo_json, version): + """ + Given an upload response and zenodo json, upload new data - # Using requests files indicates multipart/form-data - # Here we are uploading the new release file - url = "https://zenodo.org/api/deposit/depositions/%s/files" % upload["id"] - bucket_url = upload["links"]["bucket"] + Note that if we don't have a zenodo.json we could use the old one. + """ + metadata = upload["metadata"] - with open(archive, "rb") as fp: + # updates from zenodo.json + if zenodo_json: + metadata.update(read_json(zenodo_json)) + metadata["version"] = version + metadata["publication_date"] = str(datetime.now()) + + # New .zenodo.json may be missing this + if "upload_type" not in metadata: + metadata["upload_type"] = "software" + self.headers.update({"Content-Type": "application/json"}) + + # Make the deposit! 
+ url = "https://zenodo.org/api/deposit/depositions/%s" % upload["id"] response = requests.put( - "%s/%s" % (bucket_url, os.path.basename(archive)), - data=fp, - params=params, + url, + data=json.dumps({"metadata": metadata}), + params=self.params, + headers=self.headers, ) if response.status_code != 200: - sys.exit("Trouble uploading artifact %s to bucket" % archive) + sys.exit( + "Trouble uploading metadata %s, %s" % response.status_code, + response.json(), + ) + return response.json() - # Finally, load .zenodo.json and add version - metadata = read_json(zenodo_json) - metadata["version"] = version - metadata["publication_date"] = str(datetime.now()) - if "upload_type" not in metadata: - metadata["upload_type"] = "software" - url = "https://zenodo.org/api/deposit/depositions/%s" % upload["id"] - headers["Content-Type"] = "application/json" - response = requests.put( - url, data=json.dumps({"metadata": metadata}), params=params, headers=headers - ) - if response.status_code != 200: - sys.exit( - "Trouble uploading metadata %s, %s" % response.status_code, response.json() - ) - data = response.json() - publish_url = data["links"]["publish"] - r = requests.post(publish_url, params=params) - if r.status_code not in [200, 201, 202]: - sys.exit( - "Issue publishing record: %s, %s" % (response.status_code, response.json()) - ) +def upload_archive(archive, version, zenodo_json=None, doi=None, sandbox=False): + """ + Upload an archive to an existing Zenodo "versions DOI" + """ + archive = os.path.abspath(archive) + if not os.path.exists(archive): + sys.exit("Archive %s does not exist." 
% archive) + + cli = Zenodo(sandbox=sandbox) + + if doi: + upload = cli.update_doi(doi=doi) + else: + if not zenodo_json: + sys.exit("You MUST provided a .zenodo.json template to create a new DOI.") + upload = cli.new_doi() + + # Use a glob matching pattern to upload new files (also ensures exist) + for path in glob(archive): + cli.upload_archive(upload, path) - published = r.json() - print("::group::Record") - print(json.dumps(published, indent=4)) - print("::endgroup::") - for k, v in published["links"].items(): - print("::set-output name=%s::%s" % (k, v)) + # Finally, load .zenodo.json and add version + data = cli.upload_metadata(upload, zenodo_json, version) + + # Finally, publish + cli.publish(data) def get_parser(): @@ -118,9 +269,9 @@ def get_parser(): "--zenodo-json", dest="zenodo_json", help="path to .zenodo.json (defaults to .zenodo.json)", - default=".zenodo.json", ) upload.add_argument("--version", help="version to upload") + upload.add_argument("--doi", help="an existing DOI to add a new version to") return parser @@ -136,18 +287,24 @@ def help(return_code=0): if not args.command: help() - if not args.zenodo_json or not os.path.exists(args.zenodo_json): - sys.exit( - "You must provide an existing .zenodo.json as the first positional argument." - ) + if args.zenodo_json and not os.path.exists(args.zenodo_json): + sys.exit("%s does not exist." % args.zenodo_json) if not args.archive: sys.exit("You must provide an archive as the second positional argument.") if not args.version: sys.exit("You must provide a software version to upload.") - # Prepare drafts if args.command == "upload": - upload_archive(args.archive, args.zenodo_json, args.version) + upload_archive( + archive=args.archive, + zenodo_json=args.zenodo_json, + version=args.version, + doi=args.doi, + ) + + # We should not get here :) + else: + sys.exit("Unrecognized command %s" % args.command) if __name__ == "__main__":