File: clean-mirror.sh

package info (click to toggle)
node-yarnpkg 1.13.0-1%2Bdeb10u1
  • links: PTS, VCS
  • area: main
  • in suites: buster
  • size: 93,036 kB
  • sloc: sh: 323; makefile: 19
file content (126 lines) | stat: -rwxr-xr-x 3,942 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
#!/usr/bin/env bash

# This script finds all packages located inside an offline mirror, all packages referenced by yarn.lock files, and remove those which aren't referenced anymore.
# The first argument is the directory where your offline mirror lives, and the second one is the location where the script should recursively start looking for yarn.lock files.
# If you only have a single project in your mirror, you can use the purge configuration to automatically remove packages from it as they are dereferenced (`yarn config set yarn-offline-mirror-pruning true`).

set -e

DRY_RUN=0
MAKE_STATS=0

OPTIND=1; while getopts "ds" opt; do
    case "$opt" in
        d) DRY_RUN=1;;
        s) MAKE_STATS=1;;
    esac
done

shift $((OPTIND-1))

if [[ "$#" -ne 2 ]] || ! [[ -d "$1" ]] || ! [[ -d "$2" ]]; then
    echo "Usage: $0 <offline mirror path> <projects common path>" >&2
    exit 1
fi

TEMP=$(mktemp -d)
trap "rm -rf $TEMP" EXIT

MIRROR="$1"
SOURCES="$2"

# Find all yarn.lock files in the source directory
find "${SOURCES}" -type f -name yarn.lock > "${TEMP}.ylocks"

# Extract the part right before the hash, and remove duplicates
xargs cat < "${TEMP}.ylocks" | grep -E '^[ \t]*resolved[ \t]+' | perl -pe 's/^(?:[^\/ \n]*[\/ ])*([^#]*)#.*$/\1/gm' | sort | uniq > "${TEMP}.deps"

# Obtain the list of package filenames from the specified directory
find "${MIRROR}" -maxdepth 1 \( -type f -a -not -name '.*' \) -exec basename {} \; | sort > "${TEMP}.files"

# Compute the list of files that are in the directory but not in the dependencies
comm -13 "${TEMP}.deps" "${TEMP}.files" > "${TEMP}.diff"

# Get the number of lockfiles we've found
ylocks=$(wc -l < "${TEMP}.ylocks" | grep -oE [0-9]+)

# Compute the total number of files in the directory
total=$(wc -l < "${TEMP}.files" | grep -oE [0-9]+)

# Early exits if we have no diff
diff=$(wc -l < "${TEMP}.diff" | grep -oE [0-9]+)

if [[ $diff -eq 0 ]]; then

    echo "No garbage found." >&2
    exit 0

elif [[ $ylocks -eq 0 ]]; then

    echo "No lockfiles found. If this is to be expected, please just remove the offline mirror by hand." >&2
    exit 125

else

    # If in dry run, we can just print this list and exits
    if [[ $DRY_RUN -eq 1 ]]; then

        if [[ $diff -eq $total ]]; then
            echo "Assertion failed: running this script would remove all packages."
            echo
        fi

        echo "# Lockfiles"
        echo
        cat "${TEMP}.ylocks"
        echo
        echo "# Unreferenced packages"
        echo
        cat "${TEMP}.diff"

        if [[ $MAKE_STATS -eq 1 ]]; then
            size=$(cd "${MIRROR}" && xargs -n1 wc -c < "${TEMP}.diff" | awk '{s+=$1}END{print s}')
            echo
            echo "Removing them would free about $(numfmt --to=iec-i --suffix=B --format="%.3f" $size)"
        fi

        if [[ $diff -eq $total ]]; then
            exit 1
        else
            exit 0
        fi

    else

        if [[ $diff -eq $total ]]; then

            echo "Assertion failed: running this script would remove all packages." >&2
            exit 1

        else

            # Compute the extensions used by the soon-to-be-removed files
            exts=$(grep -oE '(\.[a-z]+)+$' < "${TEMP}.diff" | sort | uniq | paste -sd ', ' -)

            # Check with the user that everything is ok
            response=
            while ! [[ $response =~ ^(yes|y|no|n)$ ]]; do
                read -r -p "This command will remove ${diff} file(s) (extensions are: ${exts}). Are you sure? [Y/n] " response < /dev/tty
                response=$(tr '[:upper:]' '[:lower:]' <<< "${response}")
            done

            if [[ $response =~ ^(yes|y)$ ]]; then
                cd "${MIRROR}"
                sed 's/\r\n?/\n/g' < "${TEMP}.diff" | while read -r filename; do
                    echo "Removing ${filename}..."
                    rm "${filename}"
                done
            fi

            exit 0

        fi

    fi

fi