#!/usr/bin/env bash # This file is part of license-reporter # Copyright (C) 2017, 2018 David Hedlund # # license-reporter is free software: you can redistribute it and/or modify # it under the terms of the GNU General Public License as published by # the Free Software Foundation, either version 3 of the License, or # (at your option) any later version. # # license-reporter is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU General Public License for more details. # # You should have received a copy of the GNU General Public License # along with this program. If not, see . #if [ "$data" == "search" ]; then search_page_variable='.results[]'; fi # Specifically for titles: en-US is sometimes unused, en-GB used to be used then. # sed "s|en-US|enUS|g" "$json_file" | jq "$search_page_variable.name.enUS" | sed "s|^\"||; s|\"$||;" # sed "s|en-GB|enGB|g" "$json_file" | jq "$search_page_variable.name.enGB" | sed "s|^\"||; s|\"$||;" # sed "s|en-US|enUS|g" "$json_file" | jq "$search_page_variable.homepage.enUS" | sed "s|^\"||; s|\"$||;" # sed "s|en-US|enUS|g" "$json_file" | jq "$search_page_variable.support_email.enUS" | sed "s|^\"||; s|\"$||;" # sed "s|en-US|enUS|g" "$json_file" | jq "$search_page_variable.support_url.enUS" | sed "s|^\"||; s|\"$||;" # Licenses # sed "s|en-US|enUS|g" "$slug.json" | jq '.license.name.enUS' | sed "s|^\"||; s|\"$||;" if [ "$2" == "--debug" ]; then debug=true; else debug=false; fi minimum_average_daily_users="1000000"; SCRIPTSRC=$(readlink -f "$0" || echo "$0") RUN_PATH=$(dirname "${SCRIPTSRC}" || echo .) filename=$(basename "$0"); export -p SCRIPTSRC RUN_PATH minimum_average_daily_users debug if [ ! -f /usr/bin/jq ]; then echo "/usr/bin/jq not found!"; exit=true; fi if [ ! -f /usr/bin/wget ]; then echo "/usr/bin/wget not found!"; exit=true; fi if [[ $exit == true ]]; then exit 1; fi function check_files { if [ ! -f "$RUN_PATH/license-reporter-$check_type" ]; then echo "$RUN_PATH/license-reporter-$check_type doesn't exist."; echo "Exiting" && exit else # Make sure all links are using SSL if grep -q "http://addons.mozilla.org/" $RUN_PATH/license-reporter-$check_type; then echo "Change http://addons.mozilla.org/ to https://addons.mozilla.org/ (https)." echo "Exiting" && exit fi fi } case "$1" in ""|-help) [ "$1" = "" ] && echo "Usage: $filename [--option] [--debug] OPTIONS $0 --all $0 --fresh-build $0 --make-repository-list Downloads add-on data for free add-ons from collections shared by defined users in license-reporter-repositories. Example: https://addons.mozilla.org/en-US/firefox/collections/mozilla/ $0 --make-collection-list $0 --make-custom-list $0 --make-search-list $0 --merge-lists $0 --download-licenses-json $0 --download-free-webextensions-for-gnu-and-linux $0 --verify-license-copy " && exit 1 ;; --fresh-build) if [ -d "build" ]; then rm -fr build fi mkdir -p build ;; --make-repository-list) # It is ok to distribute only-free programs on addons.mozilla.org even if they distribute nonfree programs. # This function requires _much_ less maintainance for custom add-on's, you don't need to manually sync # your addons.mozilla.org collection list with a separate text file. # https://github.com/mozilla/addons/issues/722 # Cannot list collections in desired formats # Cannot get a list of names of Collections from other users like https://addons.mozilla.org/collections/mozilla/ without authenication (see https://addons-server.readthedocs.io/en/latest/topics/api/collections.html#list). # So we have to parse it from HTML. # Get the links to the collections function get_repositories { check_type="repositories"; check_files cd build/ || exit for i in $(cat ../license-reporter-repositories); do user=$(echo $i | sed "s|https://addons.mozilla.org/en-US/firefox/collections/||; s|/||;"); rm -f repository-$user function wget_repository { match="^ ||" >> repository-$user } # Figure out if there are several pages number_of_pages=$(wget -qO- $i | grep "?page=" | tail -n 2 | head -n 1 | sed "s|page=|\npage=|g; s|\"|\n\"|g" | grep "page=" | sed "s|page=||"); if [ -z "$number_of_pages" ]; then echo "$i doesn't have any sub pages"; wget_repository else echo "$i has sub pages"; page_number=1; while [ $page_number -le $number_of_pages ] do wget_repository__page_extension="?page=$page_number"; echo "$wget_repository__page_extension" wget_repository page_number=$(( $page_number + 1 )) done fi done } get_repositories # Download the JSON files from the collections cd .. for x in $(find build/ -name repository* | sort); do for i in $(cat $x); do collection_name=$(echo $i | sed "s|https://addons.mozilla.org/en-US/firefox/collections/||; s|/|-|; s|/$||"); wget $i"format%3Ajson" -O "build/collection-$collection_name.json" done done ;; --make-collection-list) check_type="collections"; check_files cd build/ || exit for i in $(cat ../license-reporter-collections); do # https://addons.mozilla.org/en-US/firefox/collections/DavidHedlund/webextensions/format%3Ajson collection_name=$(echo $i | sed "s|https://addons.mozilla.org/en-US/firefox/collections/||; s|/|-|; s|/$||"); wget $i"format%3Ajson" -O "collection-$collection_name.json" done ;; --make-custom-list) check_type="custom"; check_files src/download-custom ;; --make-search-list) cd build/ || exit mkdir json cd json || exit # API documentation: https://addons-server.readthedocs.io/en/latest/topics/api/addons.html page="1" function foo() { # Do not evaluate the number of extensions seen in https://addons.mozilla.org/en-US/firefox/search/ in a Quantum based browser since that will hide legacy add-ons. uri_query="page=$page&platform=linux&sort=users&type=extension&tag=firefox57"; # Get the most popular WebExtensions wget "https://addons.mozilla.org/api/v3/addons/search/?$uri_query" -O "index.html?$uri_query.json" } foo if [ "$debug" == false ]; then while [ "$(jq ".results[].average_daily_users" "index.html?$uri_query.json" | tail -n 1)" -gt "$minimum_average_daily_users" ]; do ((page++)) foo done fi # Sort by file modification time stamp for the downloaded JSON files find index*.json -type f -printf "%Tc %p\n" | sort -n | awk '{print $NF}' | while read -r file; do line="0"; for average_daily_users in $(jq ".results[].average_daily_users" "$file"); do # Exclude add-ons with to low average daily users from index.html* if [ "$average_daily_users" -ge "$minimum_average_daily_users" ]; then echo -e "$average_daily_users\t$(jq ".results[$line].id" "$file")\t$file\t$(jq ".results[$line].slug" "$file" | sed "s|^\"||; s|\"$||;")" >> ../merged-search.txt fi ((line++)) done done ;; --merge-lists) cd build || exit cat merged-search.txt >> MERGED-ALL.txt cat merged-custom.txt >> MERGED-ALL.txt ;; --get-licenses) cd build/ || exit mkdir -p json/current_versions cd json/current_versions || exit line="0"; while IFS= read -r table; do ((line++)) id=$(echo $table | awk '{print $2}'); file="$RUN_PATH/build/json/"$(echo $table | awk '{print $3}'); wget -nc "https://addons.mozilla.org/api/v3/addons/addon/$(jq ".results[$line].slug" "$file" | sed "s|^\"||; s|\"$||;")/versions/$(jq ".results[$line].current_version.id" "$file")/" -O "$id.json" done < $RUN_PATH/build/MERGED-ALL.txt ;; --merged-free) cd build/ || exit cp -a MERGED-ALL.txt MERGED-ALL-freedom_status.txt line="0"; while IFS= read -r table; do ((line++)) id=$(echo $table | awk '{print $2}'); license=$(jq .license.name $RUN_PATH/build/json/current_versions/$id.json | sed "s|en-US|enUS|;" | jq .enUS | sed "s|^\"||; s|\"$||;"); # This is the complete list of pre-defined licenses listed on AMO. Apache License 2.0 is not on the list so its not easy to detect because it has to be released under a "Custom License". if [ "$license" == "GNU General Public License, version 3.0" ] || [ "$license" == "GNU General Public License, version 2.0" ] || [ "$license" == "GNU Lesser General Public License, version 3.0" ] || [ "$license" == "GNU Lesser General Public License, version 2.1" ] || [ "$license" == "Mozilla Public License, version 2.0" ] || [ "$license" == "Mozilla Public License Version 1.1" ] || [ "$license" == "BSD License" ] || [ "$license" == "MIT/X11 License" ] then # The nonfree add-ons should not be removed since the line number must correspond with the entry number in the search result JSON files. sed -i "$line""s/$/\\tfree/" MERGED-ALL-freedom_status.txt else sed -i "$line""s/$/\\tnonfree/" MERGED-ALL-freedom_status.txt fi done < $RUN_PATH/build/MERGED-ALL.txt ;; --generate-proposed-list) line="0"; while IFS= read -r table; do ((line++)) id=$(echo $table | awk '{print $2}'); source=$(echo $table | awk '{print $3}'); license=$(jq .license.name $RUN_PATH/build/json/current_versions/$id.json | sed "s|en-US|enUS|;" | jq .enUS | sed "s|^\"||; s|\"$||;"); freedom_status=$(echo $table | awk '{print $5}'); name=$(jq .results[$line].name $RUN_PATH/build/json/$source | sed "s|en-US|enUS|;" | jq .enUS | sed "s|^\"||; s|\"$||;"); if [ "$name" == "null" ]; then name=$(jq .results[$line].name $RUN_PATH/build/json/$source | sed "s|en-GB|enGB|;" | jq .enGB | sed "s|^\"||; s|\"$||;"); fi # Clean titles. Example of bad titles: "Ghostery – Privacy Ad Blocker" if [[ $name = *"–"* ]]; then name=$(echo $name | sed 's/–/\n/g; s/-/\n/g' | head -n 1); fi if [ "$freedom_status" == "free" ]; then echo "{{Checkme item |Section= |Package=$name |Package note= }}" fi done < $RUN_PATH/build/MERGED-ALL-freedom_status.txt ;; --download-free-webextensions-for-gnu-and-linux) cd build || exit rm -fr free_webextensions_for_GNU_and_Linux mkdir free_webextensions_for_GNU_and_Linux cd free_webextensions_for_GNU_and_Linux || exit line="0"; while IFS= read -r license; do ((line++)) # Add-ons not avalible for GNU/Linux will be ignored (used to be very few dough). wget -nc "https://addons.mozilla.org/firefox/downloads/latest/$slug/addon-$id-latest.xpi" || wget -nc "https://addons.mozilla.org/firefox/downloads/latest/$slug/platform:2/addon-$id-latest.xpi" done < ../license.name.enUS.txt ;; --verify-license-copy) cd build || exit rm -fr VERIFY-LICENSE-COPY.txt cd free_webextensions_for_GNU_and_Linux || exit while IFS= read -r id; do if [ ! -f "addon-$id-latest.xpi" ]; then echo "Nonfree" >> ../VERIFY-LICENSE-COPY.txt elif unzip -l "addon-$id-latest.xpi" | awk '{ print $4 }' | grep -q "^LICENSE$"; then echo "LICENSE" >> ../VERIFY-LICENSE-COPY.txt elif unzip -l "addon-$id-latest.xpi" | awk '{ print $4 }' | grep -q "^LICENSE.txt$"; then echo "LICENSE.txt" >> ../VERIFY-LICENSE-COPY.txt elif unzip -l "addon-$id-latest.xpi" | awk '{ print $4 }' | grep -q "^LICENSE.md$"; then echo "LICENSE.md" >> ../VERIFY-LICENSE-COPY.txt elif unzip -l "addon-$id-latest.xpi" | awk '{ print $4 }' | grep -q "^COPYING$"; then echo "COPYING" >> ../VERIFY-LICENSE-COPY.txt elif unzip -l "addon-$id-latest.xpi" | awk '{ print $4 }' | grep -q "^COPYING.txt$"; then echo "COPYING.txt" >> ../VERIFY-LICENSE-COPY.txt elif unzip -l "addon-$id-latest.xpi" | awk '{ print $4 }' | grep -q "^COPYING.md$"; then echo "COPYING.md" >> ../VERIFY-LICENSE-COPY.txt else echo "Request" >> ../VERIFY-LICENSE-COPY.txt fi done < ../id.txt line="0"; while IFS= read -r status; do ((line++)) average_daily_users="$(sed -n ${line}p ../average_daily_users.txt)"; id="$(sed -n ${line}p ../id.txt)"; slug="$(sed -n ${line}p ../slug.txt)"; license_name_en_US="$(sed -n ${line}p ../license.name.enUS.txt)"; homepage_en_US="$(sed -n ${line}p ../homepage.en-US.txt | sed "s|3A\\/\\/|\n|" | tail -n 1)"; support_email_en_US="$(sed -n ${line}p ../support_email.en-US.txt)"; support_url_en_US="$(sed -n ${line}p ../support_url.en-US.txt | sed "s|3A\\/\\/|\n|" | tail -n 1)"; if [ "$license_name_en_US" == "GNU General Public License, version 3.0" ]; then license_txt="https://www.gnu.org/licenses/gpl-3.0.txt"; license_file_name="COPYING"; elif [ "$license_name_en_US" == "GNU General Public License, version 2.0" ]; then license_txt="https://www.gnu.org/licenses/old-licenses/gpl-2.0.txt"; license_file_name="COPYING"; elif [ "$license_name_en_US" == "GNU Lesser General Public License, version 3.0" ]; then license_txt="https://www.gnu.org/licenses/lgpl-3.0.txt"; license_file_name="COPYING"; elif [ "$license_name_en_US" == "GNU Lesser General Public License, version 2.1" ]; then license_txt="https://www.gnu.org/licenses/old-licenses/lgpl-2.1.txt"; license_file_name="COPYING"; elif [ "$license_name_en_US" == "Mozilla Public License, version 2.0" ]; then license_txt="https://www.mozilla.org/media/MPL/2.0/index.txt"; license_file_name="LICENSE"; elif [ "$license_name_en_US" == "Mozilla Public License Version 1.1" ]; then license_txt="https://www.mozilla.org/media/MPL/1.1/index.txt"; license_file_name="LICENSE"; elif [ "$license_name_en_US" == "BSD License" ]; then license_txt="https://directory.fsf.org/wiki?title=License:FreeBSD"; license_file_name="LICENSE"; elif [ "$license_name_en_US" == "MIT/X11 License" ]; then license_txt="https://directory.fsf.org/wiki/License:X11"; license_file_name="LICENSE"; fi if [ "$(sed -n ${line}p ../name.en-US.txt)" != "null" ]; then name="$(sed -n ${line}p ../name.en-US.txt)"; elif [ "$(sed -n ${line}p ../name.en-GB.txt)" != "null" ]; then name="$(sed -n ${line}p ../name.en-GB.txt)"; else name="$slug"; fi if [ "$status" = "Request" ]; then ((count_reports++)) # Authors that don't provide contact information will be ignored, its impossible to track conversations in Reviews anyway, because they will be deleted. if [ "$homepage_en_US" != "null" ] || [ "$support_url_en_US" != "null" ] || [ "$support_email_en_US" != "null" ]; then decimals="$(echo "$average_daily_users" | sed -r ':L;s=\b([0-9]+)([0-9]{3})\b=\1,\2=g;t L')"; echo " $decimals average daily users: $name - https://addons.mozilla.org/en-US/firefox/addon/$slug/ Request: \"You have distributed $name under $license_name_en_US on https://addons.mozilla.org/en-US/firefox/addon/$slug/, but you have not added a copy of the license. can you please download the text of the license from $license_txt and add save it to file name $license_file_name and put it in the root directory of you program?\" by contacting:"; if [ "$homepage_en_US" != "null" ]; then echo " * Homepage (please submit Pull Request for $license_file_name if possible): $homepage_en_US"; fi if [ "$support_url_en_US" != "null" ]; then echo " * Support URL (please submit Pull Request for $license_file_name if possible): $support_url_en_US"; fi if [ "$support_email_en_US" != "null" ]; then echo " * Support E-mail: $support_email_en_US"; fi fi fi done < ../VERIFY-LICENSE-COPY.txt echo " ######################### $count_reports reports to submit"; ;; --all) $0 --fresh-build "$2" $0 --make-repository-list "$2" $0 --make-collection-list "$2" $0 --make-custom-list "$2" $0 --make-search-list "$2" $0 --merge-lists "$2" # $0 --download-licenses-json "$2" # $0 --download-free-webextensions-for-gnu-and-linux "$2" # $0 --verify-license-copy "$2" ;; esac