blob: b38b398b08174d2deb759c7bd8d655a9a5e6777a [file] [log] [blame]
#!/bin/bash
# Copyright 2021 The Chromium Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
# Produce a list of directories that contain files with instances of
# non-inclusive language (e.g. whitelist, blacklist, master, slave). // nocheck
# Each line is formatted:
# <path> <instance count across files> <distinct file count>
# (separated by spaces). The counts are not recursive, so they do not sum up
# values from child directories, only files directly in the listed path.
#
# The intended consumer of this list is the CheckInclusiveLanguage function
# in ../PRESUBMIT.py. It does not perform its check on files directly under
# the paths listed here.
#
# See https://bugs.chromium.org/p/chromium/issues/detail?id=1177609 for more
# context.
#
# To update the list so the PRESUBMIT will use it in prod, write the output to
# ./inclusive_language_presubmit_exempt_dirs in a new CL, and land it. Example:
#
# % infra/update_inclusive_language_presubmit_exempt_dirs.sh > \
# infra/inclusive_language_presubmit_exempt_dirs.txt
#
# Note: This script produces the list relative to the current working dir.
# To generate the list of exempted legacy directories for chromium/src for
# instance, you should run this from the parent of the current directory
# rather than from this directory.
NON_INCLUSIVE_TERMS='\b((black|white)list|master|slave)\b' # // nocheck
git grep -c -E $NON_INCLUSIVE_TERMS | \
awk -F ":" 'NF {cmd=sprintf("dirname %s",$1);cmd | getline dirname; \
a[dirname] += $2; b[dirname] += 1} END {for (i in a) print i, a[i], b[i]}' \
| sort