#!/bin/sh
#
# SPDX-License-Identifier: GPL-2.0-only

# DESCR: Check for non-ASCII and unprintable characters

# Force the C locale so the bracket ranges used by the greps below are
# evaluated on plain byte values, independent of the caller's environment.
LC_ALL=C
export LC_ALL

# Filters used by the scan below. All of them are basic regular expressions
# joined with the '\|' alternation operator; a bare '|' would be matched as a
# literal character and silently disable the alternatives around it.
#   INCLUDED_FILES   - paths that are checked
#   EXCLUDED_DIRS    - path prefixes that are skipped
#   EXCLUDED_FILES   - individual paths that are skipped
#   EXCLUDED_PHRASES - reported lines containing one of these phrases are
#                      dropped (matched case-insensitively)
INCLUDED_FILES='\.[chsS]$\|\.asl$\|\.cb$\|\.inc$\|Kconfig\|\.ld$\|\.txt\|\.hex'
EXCLUDED_DIRS='^payloads/external/\|^src/vendorcode/\|^Documentation/'
EXCLUDED_FILES='to-wiki/towiki\.sh$\|vga/vga_font\|video/font\|PDCurses.*x11'
EXCLUDED_PHRASES='Copyright\|Ported to\|Intel®\|°C\|°F\|Athlon™\|Copyright.*©'

# The scan below uses git to enumerate files, so stop quietly when git is not
# installed or when the current directory is not inside a git work tree.
git_path=$(command -v git)
if [ -z "$git_path" ]; then
	exit
fi

inside_tree=$(git rev-parse --is-inside-work-tree 2>/dev/null)
if [ "$inside_tree" != "true" ]; then
	exit
fi

# 1. List the tracked files that contain at least one byte outside the range
#    TAB (0x09) to ~ (0x7E), and keep only the paths selected by
#    INCLUDED_FILES, EXCLUDED_DIRS and EXCLUDED_FILES.
# 2. In each remaining file, find the lines holding any character that isn't
#    TAB, or space (0x20) to ~ (0x7E).
#    LF (0x0A) isn't included, as it ends the grep line.
# 3. Remove common phrases and names that have been found.
# 4. Run the result through grep again to highlight the issues that were
#    found. Without this step, the characters can be difficult to see.

# Build the bracket expression with a literal TAB: POSIX grep does not
# interpret '\t' inside a basic regular expression.
TAB=$(printf '\t')
NON_ASCII="[^${TAB} -~]"

# xargs -I runs grep on one file at a time, so -H is needed to get the file
# name printed in front of each hit; '--' keeps an unusual path from being
# parsed as an option.
git grep -lP "[^\t-~]" | \
	grep "$INCLUDED_FILES" | \
	grep -v "$EXCLUDED_DIRS" | \
	grep -v "$EXCLUDED_FILES" | \
	xargs -I % \
		grep -Hn -e "$NON_ASCII" -- % | \
	grep -iv "$EXCLUDED_PHRASES" | \
	grep --color='auto' "$NON_ASCII"