-
-
Notifications
You must be signed in to change notification settings - Fork 238
/
Copy pathscrape_hexpm.sh
executable file
·46 lines (31 loc) · 1.24 KB
/
scrape_hexpm.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
#!/usr/bin/sh
# This script will scrape packages from hex.pm that are believed to be
# Erlang packages. We do this by first walking through all packages and
# then getting the most recent release of each package. If the build tools
# listed contain "rebar3" we keep them and write the package
# name and version to a file.
#
# This script should only be run occasionally to refresh the file
# containing the list of packages.
#
# @todo Some of the projects fetched are Elixir despite indicating
# "rebar3" or "make". We should ignore them here once identified
# so they don't make it to the output.
NUM=1
while true; do
echo "# Packages page $NUM"
PAGE=$(curl -s "https://hex.pm/api/packages?sort=name&page=$NUM")
if [ "$PAGE" = "[]" ]; then exit 0; fi
PACKAGES=$(echo $PAGE | jq -r "map({name: .name, url: .releases[0].url})")
echo $PACKAGES | jq -r '.[] | [.name, .url] | join(" ")' | while read -r NAMEURL; do
NAME=$(echo $NAMEURL | awk '{print $1;}')
URL=$(echo $NAMEURL | awk '{print $2;}')
VERSION=$(curl -s "$URL" | jq 'select(.meta.build_tools | index("rebar3")) | .version | tostring')
VERSION=$(echo $VERSION | tr -d '"')
if [ -n "$VERSION" ]; then
echo "$NAME $VERSION"
fi
done
NUM=$(expr $NUM + 1)
sleep 10
done