Tools/Scripts/webkitpy/style/filereader.py - WebKit - Git at Google

 # Copyright (C) 2009 Google Inc. All rights reserved.
 # Copyright (C) 2010 Chris Jerdonek (chris.jerdonek@gmail.com)
 # Copyright (C) 2010 ProFUSION embedded systems
 #
 # Redistribution and use in source and binary forms, with or without
 # modification, are permitted provided that the following conditions are
 # met:
 #
 #     * Redistributions of source code must retain the above copyright
 # notice, this list of conditions and the following disclaimer.
 #     * Redistributions in binary form must reproduce the above
 # copyright notice, this list of conditions and the following disclaimer
 # in the documentation and/or other materials provided with the
 # distribution.
 #     * Neither the name of Google Inc. nor the names of its
 # contributors may be used to endorse or promote products derived from
 # this software without specific prior written permission.
 #
 # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 """Supports reading and processing text files."""

 import logging
 import sys

 from webkitpy.common.host import Host


 # Module-level logger, named after this module so that log output can be
 # filtered per module.
 _log = logging.getLogger(__name__)


 class TextFileReader(object):

     """Supports reading and processing text files.

     Attributes:
       filesystem: The object used for all path and file access.
       file_count: The number of distinct paths recorded by this
                   instance (including non-text files and files that
                   should be skipped) minus delete_only_file_count.
       delete_only_file_count: The number of files that were not
                               actually processed by this instance
                               because they have no modified lines,
                               but that should be treated as processed.

     """

     def __init__(self, filesystem, processor):
         """Create an instance.

         Arguments:
           filesystem: The object used to resolve, test and open paths
                       (abspath, exists, isdir, files_under, open_stdin
                       and open_text_file_for_reading are called on it).
           processor: A ProcessorBase instance.

         """
         self.filesystem = filesystem
         self._processor = processor
         # Maps absolute path -> list of modified line numbers, or None
         # when no line numbers have been recorded for that path.
         self._files = {}
         self.delete_only_file_count = 0

     @property
     def file_count(self):
         """Return the number of recorded paths minus the delete-only count."""
         return len(self._files) - self.delete_only_file_count

     def _read_lines(self, file_path):
         """Read the file at a path, and return its lines.

         Arguments:
           file_path: The path to read, or "-" to read from stdin.

         Returns:
           The file contents split on newline characters.  Contents that
           end with a newline therefore yield a trailing empty string.

         Raises:
           IOError: If the file does not exist or cannot be read.

         """
         # Support the UNIX convention of using "-" for stdin.
         if file_path == '-':
             text_file = self.filesystem.open_stdin()
         else:
             # We do not open the file with universal newline support
             # (codecs does not support it anyway), so the resulting
             # lines contain trailing "\r" characters if we are reading
             # a file with CRLF endings.
             text_file = self.filesystem.open_text_file_for_reading(file_path, 'replace')

         # Close the handle even when read() raises.
         try:
             contents = text_file.read()
         finally:
             text_file.close()

         return contents.split('\n')

     def process_file(self, file_path, **kwargs):
         """Process the given file by calling the processor's process() method.

         The file is recorded under its absolute path before anything
         else happens, so it is counted even when it is later skipped
         or turns out to be unreadable.

         Args:
           file_path: The path of the file to process, or "-" for stdin.
           **kwargs: Any additional keyword parameters that should be passed
                     to the processor's process() method.  The process()
                     method should support these keyword arguments.  A
                     non-empty 'line_numbers' list is also accumulated
                     for the file.

         Raises:
           IOError: If file_path is not "-" and no file exists there.

         """
         abs_file_path = self.filesystem.abspath(file_path)
         if abs_file_path not in self._files:
             self._files[abs_file_path] = None

         line_numbers = kwargs.get('line_numbers')
         if line_numbers:
             # Deleted files are recorded as None, but if a file has
             # modified lines, that information overrides the None.
             recorded = self._files[abs_file_path]
             if recorded is None:
                 recorded = []
             # Concatenate into a new list so the caller's list is never
             # mutated.
             self._files[abs_file_path] = recorded + line_numbers

         if file_path != "-" and not self.filesystem.exists(file_path):
             _log.error("File does not exist: '%s'", file_path)
             raise IOError("File does not exist")

         if not self._processor.should_process(file_path):
             _log.debug("Skipping file: '%s'", file_path)
             return
         _log.debug("Processing file: '%s'", file_path)

         try:
             lines = self._read_lines(file_path)
         except IOError as err:
             # Unreadable files are skipped on a best-effort basis rather
             # than aborting the whole run.
             _log.warning("Could not read file. Skipping: '%s'\n  %s", file_path, err)
             return

         self._processor.process(lines, file_path, **kwargs)

     def _process_directory(self, directory):
         """Process all files in the given directory, recursively."""
         for file_path in self.filesystem.files_under(directory):
             self.process_file(file_path)

     def process_paths(self, paths):
         """Process each path, descending into those that are directories."""
         for path in paths:
             if self.filesystem.isdir(path):
                 self._process_directory(directory=path)
             else:
                 self.process_file(path)

     def do_association_check(self, cwd, host=None):
         """Run the processor's association check over the recorded files.

         Arguments:
           cwd: Passed through to the processor's do_association_check().
           host: The Host handed to the processor.  A new Host() is
                 created when this is omitted.

         """
         # Build the default lazily: a Host() in the signature would be
         # constructed once at import time and shared by every call.
         if host is None:
             host = Host()
         self._processor.do_association_check(self._files, cwd, host=host)

     def delete_file(self, file_path=None):
         """Keep track of deleted files.

         Files which have no modified or newly-added lines don't need
         a style check, but they may affect the association check.

         Arguments:
           file_path: The path to record with no line numbers.  When it
                      is omitted or empty nothing is recorded, but
                      delete_only_file_count is still incremented.

         """
         if file_path:
             self._files[self.filesystem.abspath(file_path)] = None
         self.delete_only_file_count += 1
	# Copyright (C) 2009 Google Inc. All rights reserved.
	# Copyright (C) 2010 Chris Jerdonek (chris.jerdonek@gmail.com)
	# Copyright (C) 2010 ProFUSION embedded systems
	#
	# Redistribution and use in source and binary forms, with or without
	# modification, are permitted provided that the following conditions are
	# met:
	#
	# * Redistributions of source code must retain the above copyright
	# notice, this list of conditions and the following disclaimer.
	# * Redistributions in binary form must reproduce the above
	# copyright notice, this list of conditions and the following disclaimer
	# in the documentation and/or other materials provided with the
	# distribution.
	# * Neither the name of Google Inc. nor the names of its
	# contributors may be used to endorse or promote products derived from
	# this software without specific prior written permission.
	#
	# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
	# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
	# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
	# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
	# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
	# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
	# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
	# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
	# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
	# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
	# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

	"""Supports reading and processing text files."""

	import logging
	import sys

	from webkitpy.common.host import Host


	# Module-level logger, named after this module so that log output can be
	# filtered per module.
	_log = logging.getLogger(__name__)


	class TextFileReader(object):

	    """Supports reading and processing text files.

	    Attributes:
	      filesystem: The object used for all path and file access.
	      file_count: The number of distinct paths recorded by this
	                  instance (including non-text files and files that
	                  should be skipped) minus delete_only_file_count.
	      delete_only_file_count: The number of files that were not
	                              actually processed by this instance
	                              because they have no modified lines,
	                              but that should be treated as processed.

	    """

	    def __init__(self, filesystem, processor):
	        """Create an instance.

	        Arguments:
	          filesystem: The object used to resolve, test and open paths
	                      (abspath, exists, isdir, files_under, open_stdin
	                      and open_text_file_for_reading are called on it).
	          processor: A ProcessorBase instance.

	        """
	        self.filesystem = filesystem
	        self._processor = processor
	        # Maps absolute path -> list of modified line numbers, or None
	        # when no line numbers have been recorded for that path.
	        self._files = {}
	        self.delete_only_file_count = 0

	    @property
	    def file_count(self):
	        """Return the number of recorded paths minus the delete-only count."""
	        return len(self._files) - self.delete_only_file_count

	    def _read_lines(self, file_path):
	        """Read the file at a path, and return its lines.

	        Arguments:
	          file_path: The path to read, or "-" to read from stdin.

	        Returns:
	          The file contents split on newline characters.  Contents that
	          end with a newline therefore yield a trailing empty string.

	        Raises:
	          IOError: If the file does not exist or cannot be read.

	        """
	        # Support the UNIX convention of using "-" for stdin.
	        if file_path == '-':
	            text_file = self.filesystem.open_stdin()
	        else:
	            # We do not open the file with universal newline support
	            # (codecs does not support it anyway), so the resulting
	            # lines contain trailing "\r" characters if we are reading
	            # a file with CRLF endings.
	            text_file = self.filesystem.open_text_file_for_reading(file_path, 'replace')

	        # Close the handle even when read() raises.
	        try:
	            contents = text_file.read()
	        finally:
	            text_file.close()

	        return contents.split('\n')

	    def process_file(self, file_path, **kwargs):
	        """Process the given file by calling the processor's process() method.

	        The file is recorded under its absolute path before anything
	        else happens, so it is counted even when it is later skipped
	        or turns out to be unreadable.

	        Args:
	          file_path: The path of the file to process, or "-" for stdin.
	          **kwargs: Any additional keyword parameters that should be passed
	                    to the processor's process() method.  The process()
	                    method should support these keyword arguments.  A
	                    non-empty 'line_numbers' list is also accumulated
	                    for the file.

	        Raises:
	          IOError: If file_path is not "-" and no file exists there.

	        """
	        abs_file_path = self.filesystem.abspath(file_path)
	        if abs_file_path not in self._files:
	            self._files[abs_file_path] = None

	        line_numbers = kwargs.get('line_numbers')
	        if line_numbers:
	            # Deleted files are recorded as None, but if a file has
	            # modified lines, that information overrides the None.
	            recorded = self._files[abs_file_path]
	            if recorded is None:
	                recorded = []
	            # Concatenate into a new list so the caller's list is never
	            # mutated.
	            self._files[abs_file_path] = recorded + line_numbers

	        if file_path != "-" and not self.filesystem.exists(file_path):
	            _log.error("File does not exist: '%s'", file_path)
	            raise IOError("File does not exist")

	        if not self._processor.should_process(file_path):
	            _log.debug("Skipping file: '%s'", file_path)
	            return
	        _log.debug("Processing file: '%s'", file_path)

	        try:
	            lines = self._read_lines(file_path)
	        except IOError as err:
	            # Unreadable files are skipped on a best-effort basis rather
	            # than aborting the whole run.
	            _log.warning("Could not read file. Skipping: '%s'\n %s", file_path, err)
	            return

	        self._processor.process(lines, file_path, **kwargs)

	    def _process_directory(self, directory):
	        """Process all files in the given directory, recursively."""
	        for file_path in self.filesystem.files_under(directory):
	            self.process_file(file_path)

	    def process_paths(self, paths):
	        """Process each path, descending into those that are directories."""
	        for path in paths:
	            if self.filesystem.isdir(path):
	                self._process_directory(directory=path)
	            else:
	                self.process_file(path)

	    def do_association_check(self, cwd, host=None):
	        """Run the processor's association check over the recorded files.

	        Arguments:
	          cwd: Passed through to the processor's do_association_check().
	          host: The Host handed to the processor.  A new Host() is
	                created when this is omitted.

	        """
	        # Build the default lazily: a Host() in the signature would be
	        # constructed once at import time and shared by every call.
	        if host is None:
	            host = Host()
	        self._processor.do_association_check(self._files, cwd, host=host)

	    def delete_file(self, file_path=None):
	        """Keep track of deleted files.

	        Files which have no modified or newly-added lines don't need
	        a style check, but they may affect the association check.

	        Arguments:
	          file_path: The path to record with no line numbers.  When it
	                     is omitted or empty nothing is recorded, but
	                     delete_only_file_count is still incremented.

	        """
	        if file_path:
	            self._files[self.filesystem.abspath(file_path)] = None
	        self.delete_only_file_count += 1