-
-
Notifications
You must be signed in to change notification settings - Fork 17
/
Copy pathget_biocontainers.py
executable file
·56 lines (40 loc) · 1.35 KB
/
get_biocontainers.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
#!/usr/bin/env python3
import argparse
import os
import requests
from bs4 import BeautifulSoup
# .github/scripts
here = os.path.abspath(os.path.dirname(__file__))
root = os.path.dirname(os.path.dirname(here))
def get_parser():
parser = argparse.ArgumentParser(
description="BioContainer Lister",
formatter_class=argparse.RawTextHelpFormatter,
)
parser.add_argument(
"filename", help="Path to filename to write container listing to."
)
return parser
def main():
parser = get_parser()
# If an error occurs while parsing the arguments, the interpreter will exit with value 2
args, extra = parser.parse_known_args()
# Show args to the user
print("filename: %s" % args.filename)
response = requests.get("https://depot.galaxyproject.org/singularity/")
soup = BeautifulSoup(response.text, "html.parser")
links = soup.find_all("a")
images = set()
# Use the latest for each unique
for link in links:
if ":" not in link.text:
continue
image, tag = link.text.split(":", 1)
images.add(image)
print("Found %s BioContainers images" % len(images))
# Write skips back to file for faster parsing
with open(args.filename, "w") as fd:
for image in sorted(list(images)):
fd.write(image + "\n")
if __name__ == "__main__":
main()