#!/usr/bin/env python3
################################################################################
#
# Copyright (c) 2020, Perforce Software, Inc. All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions are met:
#
# 1. Redistributions of source code must retain the above copyright
# notice, this list of conditions and the following disclaimer.
#
# 2. Redistributions in binary form must reproduce the above copyright
# notice, this list of conditions and the following disclaimer in the
# documentation and/or other materials provided with the distribution.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
# ARE DISCLAIMED. IN NO EVENT SHALL PERFORCE SOFTWARE, INC. BE LIABLE FOR ANY
# DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
# (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
# LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
# ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
# THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
#
# DATE
#
# $Date: 2020/04/02 $
#
# SYNOPSIS
#
# BOMDetection.py file
#
# DESCRIPTION
#
# This script checks for any UTF8 BOM in file
# It is intended to be against a list of server depot file of utf8 filetype
# which be encoded in UTF8 no BOM
# Example of command to be run on the server itself:
# p4 -F%lbrPath% fstat -Obf -F headType=*utf8* //... | python BOMDetection.py
# (the above -Ob flag requires a 2017.2 or higher server)
#
################################################################################
from __future__ import print_function
import sys
import re
def main():
if len(sys.argv) > 1:
sys.exit("stdin argument only, see script header")
else:
for file in sys.stdin:
filename = file.splitlines()[0]
for line in open(filename, "rb"):
if re.search(b"\xEF\xBB\xBF", line):
print("UTF8 BOM detected in " + filename)
break
if __name__ == '__main__':
main()