| import math |
| import torch |
| from typing import Optional |
| |
| |
| class __PrinterOptions(object): |
| precision: int = 4 |
| threshold: float = 1000 |
| edgeitems: int = 3 |
| linewidth: int = 80 |
| sci_mode: Optional[bool] = None |
| |
| |
| PRINT_OPTS = __PrinterOptions() |
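# PRINT_OPTS is the module-level singleton that the formatting helpers below
# consult. set_printoptions() mutates it in place, so e.g.
# torch.set_printoptions(precision=2) affects every subsequent tensor repr.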
| |
| |
| # We could use **kwargs, but this will give better docs |
| def set_printoptions( |
| precision=None, |
| threshold=None, |
| edgeitems=None, |
| linewidth=None, |
| profile=None, |
| sci_mode=None |
| ): |
| r"""Set options for printing. Items shamelessly taken from NumPy |
| |
| Args: |
| precision: Number of digits of precision for floating point output |
| (default = 4). |
| threshold: Total number of array elements which trigger summarization |
| rather than full `repr` (default = 1000). |
| edgeitems: Number of array items in summary at beginning and end of |
| each dimension (default = 3). |
| linewidth: The number of characters per line for the purpose of |
| inserting line breaks (default = 80). Thresholded matrices will |
| ignore this parameter. |
| profile: Sane defaults for pretty printing. Can override with any of |
| the above options. (any one of `default`, `short`, `full`) |
        sci_mode: Enable (True) or disable (False) scientific notation. If
            None (default) is specified, the value is chosen automatically by
            the framework (see `torch._tensor_str._Formatter`).
| |
| Example:: |
| |
| >>> torch.set_printoptions(precision=2) |
| >>> torch.tensor([1.12345]) |
| tensor([1.12]) |
| >>> torch.set_printoptions(threshold=5) |
| >>> torch.arange(10) |
| tensor([0, 1, 2, ..., 7, 8, 9]) |
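        >>> # values spanning several orders of magnitude print in scientific notation
        >>> torch.set_printoptions(profile='default')  # reset to the defaults
        >>> torch.tensor([0.0001, 1000.])
        tensor([1.0000e-04, 1.0000e+03])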
| |
| """ |
| if profile is not None: |
| if profile == "default": |
| PRINT_OPTS.precision = 4 |
| PRINT_OPTS.threshold = 1000 |
| PRINT_OPTS.edgeitems = 3 |
| PRINT_OPTS.linewidth = 80 |
| elif profile == "short": |
| PRINT_OPTS.precision = 2 |
| PRINT_OPTS.threshold = 1000 |
| PRINT_OPTS.edgeitems = 2 |
| PRINT_OPTS.linewidth = 80 |
| elif profile == "full": |
| PRINT_OPTS.precision = 4 |
        PRINT_OPTS.threshold = math.inf
| PRINT_OPTS.edgeitems = 3 |
| PRINT_OPTS.linewidth = 80 |
| |
| if precision is not None: |
| PRINT_OPTS.precision = precision |
| if threshold is not None: |
| PRINT_OPTS.threshold = threshold |
| if edgeitems is not None: |
| PRINT_OPTS.edgeitems = edgeitems |
| if linewidth is not None: |
| PRINT_OPTS.linewidth = linewidth |
| PRINT_OPTS.sci_mode = sci_mode |
| |
| def tensor_totype(t): |
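    # MPS has no float64 support, so stay in float32 there; everywhere else use
    # double so the min/max/ratio computations in _Formatter do not overflow
    # (e.g. for half-precision inputs).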
| dtype = torch.float if t.is_mps else torch.double |
| return t.to(dtype=dtype) |
| |
| class _Formatter(object): |
| def __init__(self, tensor): |
| self.floating_dtype = tensor.dtype.is_floating_point |
| self.int_mode = True |
| self.sci_mode = False |
| self.max_width = 1 |
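        # int_mode: every nonzero finite value is integral, so values render as
        #   e.g. '1.' instead of '1.0000'.
        # sci_mode: values span a wide range (or are very large/small), so
        #   scientific notation is used.
        # max_width: width of the widest formatted element; format() pads with
        #   spaces to this width so columns line up.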
| |
| with torch.no_grad(): |
| tensor_view = tensor.reshape(-1) |
| |
| if not self.floating_dtype: |
| for value in tensor_view: |
| value_str = '{}'.format(value) |
| self.max_width = max(self.max_width, len(value_str)) |
| |
| else: |
| nonzero_finite_vals = torch.masked_select(tensor_view, torch.isfinite(tensor_view) & tensor_view.ne(0)) |
| |
| if nonzero_finite_vals.numel() == 0: |
| # no valid number, do nothing |
| return |
| |
| # Convert to double for easy calculation. HalfTensor overflows with 1e8, and there's no div() on CPU. |
| nonzero_finite_abs = tensor_totype(nonzero_finite_vals.abs()) |
| nonzero_finite_min = tensor_totype(nonzero_finite_abs.min()) |
| nonzero_finite_max = tensor_totype(nonzero_finite_abs.max()) |
| |
| for value in nonzero_finite_vals: |
| if value != torch.ceil(value): |
| self.int_mode = False |
| break |
| |
| if self.int_mode: |
                    # in int_mode for floats, all numbers are integers, and we append a decimal to the
                    # finite values to indicate that the tensor is of floating type. add 1 to the len to account for this.
| if nonzero_finite_max / nonzero_finite_min > 1000. or nonzero_finite_max > 1.e8: |
| self.sci_mode = True |
| for value in nonzero_finite_vals: |
| value_str = ('{{:.{}e}}').format(PRINT_OPTS.precision).format(value) |
| self.max_width = max(self.max_width, len(value_str)) |
| else: |
| for value in nonzero_finite_vals: |
| value_str = ('{:.0f}').format(value) |
| self.max_width = max(self.max_width, len(value_str) + 1) |
| else: |
| # Check if scientific representation should be used. |
| if nonzero_finite_max / nonzero_finite_min > 1000.\ |
| or nonzero_finite_max > 1.e8\ |
| or nonzero_finite_min < 1.e-4: |
| self.sci_mode = True |
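                        # e.g. tensor([0.0001, 100.]) has a max/min ratio above
                        # 1000., so its values print as 1.0000e-04 and 1.0000e+02.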
| for value in nonzero_finite_vals: |
| value_str = ('{{:.{}e}}').format(PRINT_OPTS.precision).format(value) |
| self.max_width = max(self.max_width, len(value_str)) |
| else: |
| for value in nonzero_finite_vals: |
| value_str = ('{{:.{}f}}').format(PRINT_OPTS.precision).format(value) |
| self.max_width = max(self.max_width, len(value_str)) |
| |
| if PRINT_OPTS.sci_mode is not None: |
| self.sci_mode = PRINT_OPTS.sci_mode |
| |
| def width(self): |
| return self.max_width |
| |
| def format(self, value): |
| if self.floating_dtype: |
| if self.sci_mode: |
| ret = ('{{:{}.{}e}}').format(self.max_width, PRINT_OPTS.precision).format(value) |
| elif self.int_mode: |
| ret = '{:.0f}'.format(value) |
| if not (math.isinf(value) or math.isnan(value)): |
| ret += '.' |
| else: |
| ret = ('{{:.{}f}}').format(PRINT_OPTS.precision).format(value) |
| else: |
| ret = '{}'.format(value) |
| return (self.max_width - len(ret)) * ' ' + ret |
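
# Illustrative example (not executed): _Formatter(torch.tensor([1., 100.]))
# ends up in int_mode with max_width == 4, so format(1.0) returns '  1.' and
# format(100.0) returns '100.'.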
| |
| |
| def _scalar_str(self, formatter1, formatter2=None): |
| if formatter2 is not None: |
| real_str = _scalar_str(self.real, formatter1) |
| imag_str = (_scalar_str(self.imag, formatter2) + "j").lstrip() |
| # handles negative numbers, +0.0, -0.0 |
| if imag_str[0] == '+' or imag_str[0] == '-': |
| return real_str + imag_str |
| else: |
| return real_str + "+" + imag_str |
| else: |
| return formatter1.format(self.item()) |
| |
| def _vector_str(self, indent, summarize, formatter1, formatter2=None): |
| # length includes spaces and comma between elements |
| element_length = formatter1.width() + 2 |
| if formatter2 is not None: |
| # width for imag_formatter + an extra j for complex |
| element_length += formatter2.width() + 1 |
| |
| elements_per_line = max(1, int(math.floor((PRINT_OPTS.linewidth - indent) / (element_length)))) |
| char_per_line = element_length * elements_per_line |
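    # e.g. with linewidth=80, indent=8 and element_length=8 this allows
    # floor(72 / 8) = 9 elements per line.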
| |
| def _val_formatter(val, formatter1=formatter1, formatter2=formatter2): |
| if formatter2 is not None: |
| real_str = formatter1.format(val.real) |
| imag_str = (formatter2.format(val.imag) + "j").lstrip() |
| # handles negative numbers, +0.0, -0.0 |
| if imag_str[0] == '+' or imag_str[0] == '-': |
| return real_str + imag_str |
| else: |
| return real_str + "+" + imag_str |
| else: |
| return formatter1.format(val) |
| |
| if summarize and self.size(0) > 2 * PRINT_OPTS.edgeitems: |
| data = ([_val_formatter(val) for val in self[:PRINT_OPTS.edgeitems].tolist()] + |
| [' ...'] + |
| [_val_formatter(val) for val in self[-PRINT_OPTS.edgeitems:].tolist()]) |
| else: |
| data = [_val_formatter(val) for val in self.tolist()] |
| |
| data_lines = [data[i:i + elements_per_line] for i in range(0, len(data), elements_per_line)] |
| lines = [', '.join(line) for line in data_lines] |
| return '[' + (',' + '\n' + ' ' * (indent + 1)).join(lines) + ']' |
| |
| # formatter2 is only used for printing complex tensors. |
| # For complex tensors, formatter1 and formatter2 are the formatters for tensor.real |
# and tensor.imag respectively
| def _tensor_str_with_formatter(self, indent, summarize, formatter1, formatter2=None): |
| dim = self.dim() |
| |
| if dim == 0: |
| return _scalar_str(self, formatter1, formatter2) |
| |
| if dim == 1: |
| return _vector_str(self, indent, summarize, formatter1, formatter2) |
| |
| if summarize and self.size(0) > 2 * PRINT_OPTS.edgeitems: |
| slices = ([_tensor_str_with_formatter(self[i], indent + 1, summarize, formatter1, formatter2) |
| for i in range(0, PRINT_OPTS.edgeitems)] + |
| ['...'] + |
| [_tensor_str_with_formatter(self[i], indent + 1, summarize, formatter1, formatter2) |
| for i in range(len(self) - PRINT_OPTS.edgeitems, len(self))]) |
| else: |
| slices = [_tensor_str_with_formatter(self[i], indent + 1, summarize, formatter1, formatter2) |
| for i in range(0, self.size(0))] |
| |
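    # Slices are joined by a comma and (dim - 1) newlines, so e.g. the 2-d
    # sub-blocks of a 3-d tensor are separated by a blank line.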
| tensor_str = (',' + '\n' * (dim - 1) + ' ' * (indent + 1)).join(slices) |
| return '[' + tensor_str + ']' |
| |
| def _tensor_str(self, indent): |
| if self.numel() == 0: |
| return '[]' |
| |
| if self.has_names(): |
| # There are two main codepaths (possibly more) that tensor printing goes through: |
| # - tensor data can fit comfortably on screen |
| # - tensor data needs to be summarized |
| # Some of the codepaths don't fully support named tensors, so we send in |
| # an unnamed tensor to the formatting code as a workaround. |
| self = self.rename(None) |
| |
| summarize = self.numel() > PRINT_OPTS.threshold |
| |
| if self._is_zerotensor(): |
| self = self.clone() |
| |
| # handle the negative bit |
| if self.is_neg(): |
| self = self.resolve_neg() |
| |
| if self.dtype is torch.float16 or self.dtype is torch.bfloat16: |
| self = self.float() |
| |
| if self.dtype is torch.complex32: |
| self = self.cfloat() |
| |
| if self.dtype.is_complex: |
| # handle the conjugate bit |
| self = self.resolve_conj() |
| real_formatter = _Formatter(get_summarized_data(self.real) if summarize else self.real) |
| imag_formatter = _Formatter(get_summarized_data(self.imag) if summarize else self.imag) |
| return _tensor_str_with_formatter(self, indent, summarize, real_formatter, imag_formatter) |
| else: |
| formatter = _Formatter(get_summarized_data(self) if summarize else self) |
| return _tensor_str_with_formatter(self, indent, summarize, formatter) |
| |
| def _add_suffixes(tensor_str, suffixes, indent, force_newline): |
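    # e.g. _add_suffixes("tensor([1.])", ["device='cuda:0'"], 7, False) returns
    # "tensor([1.], device='cuda:0')"; a suffix wraps onto a new line once the
    # current line would exceed PRINT_OPTS.linewidth.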
| tensor_strs = [tensor_str] |
| last_line_len = len(tensor_str) - tensor_str.rfind('\n') + 1 |
| for suffix in suffixes: |
| suffix_len = len(suffix) |
| if force_newline or last_line_len + suffix_len + 2 > PRINT_OPTS.linewidth: |
| tensor_strs.append(',\n' + ' ' * indent + suffix) |
| last_line_len = indent + suffix_len |
| force_newline = False |
| else: |
| tensor_strs.append(', ' + suffix) |
| last_line_len += suffix_len + 2 |
| tensor_strs.append(')') |
| return ''.join(tensor_strs) |
| |
| |
| def get_summarized_data(self): |
| dim = self.dim() |
| if dim == 0: |
| return self |
| if dim == 1: |
| if self.size(0) > 2 * PRINT_OPTS.edgeitems: |
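            # e.g. with edgeitems=3, a length-10 vector is reduced to its first
            # and last three elements, so the formatter only measures the
            # values that will actually be shown.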
| return torch.cat((self[:PRINT_OPTS.edgeitems], self[-PRINT_OPTS.edgeitems:])) |
| else: |
| return self |
| if self.size(0) > 2 * PRINT_OPTS.edgeitems: |
| start = [self[i] for i in range(0, PRINT_OPTS.edgeitems)] |
| end = ([self[i] |
| for i in range(len(self) - PRINT_OPTS.edgeitems, len(self))]) |
| return torch.stack([get_summarized_data(x) for x in (start + end)]) |
| else: |
| return torch.stack([get_summarized_data(x) for x in self]) |
| |
| def _str_intern(inp, *, tensor_contents=None): |
| is_plain_tensor = type(inp) is torch.Tensor or type(inp) is torch.nn.Parameter |
| if inp.is_nested: |
| prefix = "nested_tensor(" |
| elif is_plain_tensor: |
| prefix = 'tensor(' |
| else: |
| prefix = f"{type(inp).__name__}(" |
| indent = len(prefix) |
| suffixes = [] |
| custom_contents_provided = tensor_contents is not None |
| if custom_contents_provided: |
| tensor_str = tensor_contents |
| |
| # This is used to extract the primal value and thus disable the forward AD |
| # within this function. |
| # TODO(albanD) This needs to be updated when more than one level is supported |
| self, tangent = torch.autograd.forward_ad.unpack_dual(inp) |
| |
| # Note [Print tensor device]: |
    # The general logic is that we only print the device when it doesn't match
    # the device specified in the default tensor type.
| # Currently torch.set_default_tensor_type() only supports CPU/CUDA, thus |
| # torch._C._get_default_device() only returns either cpu or cuda. |
| # In other cases, we don't have a way to set them as default yet, |
| # and we should always print out device for them. |
| if self.device.type != torch._C._get_default_device()\ |
| or (self.device.type == 'cuda' and torch.cuda.current_device() != self.device.index)\ |
| or (self.device.type == 'mps'): |
| suffixes.append('device=\'' + str(self.device) + '\'') |
| |
    # Tensor printing performs tensor operations like slicing and indexing to put the data in a
    # representable format. On ipu/xla/lazy tensors these operations trigger compilations, so we
    # copy the tensor to cpu before printing to avoid them.
| if self.device.type in ['xla', 'lazy', 'ipu']: |
| self = self.to('cpu') |
| |
| # TODO: add an API to map real -> complex dtypes |
| _default_complex_dtype = torch.cdouble if torch.get_default_dtype() == torch.double else torch.cfloat |
| has_default_dtype = self.dtype in (torch.get_default_dtype(), _default_complex_dtype, torch.int64, torch.bool) |
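    # e.g. with a default dtype of float32, a float16 tensor gets a
    # 'dtype=torch.float16' suffix, while float32, int64 and bool tensors do not.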
| if self.is_sparse: |
| suffixes.append('size=' + str(tuple(self.shape))) |
| suffixes.append('nnz=' + str(self._nnz())) |
| if not has_default_dtype: |
| suffixes.append('dtype=' + str(self.dtype)) |
| if not custom_contents_provided: |
| indices_prefix = 'indices=tensor(' |
| indices = self._indices().detach() |
| indices_str = _tensor_str(indices, indent + len(indices_prefix)) |
| if indices.numel() == 0: |
| indices_str += ', size=' + str(tuple(indices.shape)) |
| values_prefix = 'values=tensor(' |
| values = self._values().detach() |
| values_str = _tensor_str(values, indent + len(values_prefix)) |
| if values.numel() == 0: |
| values_str += ', size=' + str(tuple(values.shape)) |
| tensor_str = indices_prefix + indices_str + '),\n' + ' ' * indent + values_prefix + values_str + ')' |
| elif self.layout in {torch.sparse_csr, torch.sparse_csc, torch.sparse_bsr, torch.sparse_bsc}: |
| suffixes.append('size=' + str(tuple(self.shape))) |
| suffixes.append('nnz=' + str(self._nnz())) |
| if not has_default_dtype: |
| suffixes.append('dtype=' + str(self.dtype)) |
| if not custom_contents_provided: |
| compressed_indices_method, plain_indices_method = { |
| torch.sparse_csr: (torch.Tensor.crow_indices, torch.Tensor.col_indices), |
| torch.sparse_csc: (torch.Tensor.ccol_indices, torch.Tensor.row_indices), |
| torch.sparse_bsr: (torch.Tensor.crow_indices, torch.Tensor.col_indices), |
| torch.sparse_bsc: (torch.Tensor.ccol_indices, torch.Tensor.row_indices), |
| }[self.layout] |
| if self.layout in {torch.sparse_csr, torch.sparse_bsr}: |
| cdimname, pdimname = 'row', 'column' |
| else: |
| cdimname, pdimname = 'column', 'row' |
| compressed_indices_prefix = f'c{cdimname[:3]}_indices=tensor(' |
| compressed_indices = compressed_indices_method(self).detach() |
| compressed_indices_str = _tensor_str(compressed_indices, indent + len(compressed_indices_prefix)) |
| if compressed_indices.numel() == 0: |
| compressed_indices_str += ', size=' + str(tuple(compressed_indices.shape)) |
| plain_indices_prefix = f'{pdimname[:3]}_indices=tensor(' |
| plain_indices = plain_indices_method(self).detach() |
| plain_indices_str = _tensor_str(plain_indices, indent + len(plain_indices_prefix)) |
| if plain_indices.numel() == 0: |
| plain_indices_str += ', size=' + str(tuple(plain_indices.shape)) |
| values_prefix = 'values=tensor(' |
| values = self.values().detach() |
| values_str = _tensor_str(values, indent + len(values_prefix)) |
| if values.numel() == 0: |
| values_str += ', size=' + str(tuple(values.shape)) |
| tensor_str = compressed_indices_prefix + compressed_indices_str + '),\n' + ' ' * indent +\ |
| plain_indices_prefix + plain_indices_str + '),\n' + ' ' * indent +\ |
| values_prefix + values_str + ')' |
| elif self.is_quantized: |
| suffixes.append('size=' + str(tuple(self.shape))) |
| if not has_default_dtype: |
| suffixes.append('dtype=' + str(self.dtype)) |
| suffixes.append('quantization_scheme=' + str(self.qscheme())) |
| if self.qscheme() == torch.per_tensor_affine or self.qscheme() == torch.per_tensor_symmetric: |
| suffixes.append('scale=' + str(self.q_scale())) |
| suffixes.append('zero_point=' + str(self.q_zero_point())) |
| elif self.qscheme() == torch.per_channel_affine or self.qscheme() == torch.per_channel_symmetric \ |
| or self.qscheme() == torch.per_channel_affine_float_qparams: |
| suffixes.append('scale=' + str(self.q_per_channel_scales())) |
| suffixes.append('zero_point=' + str(self.q_per_channel_zero_points())) |
| suffixes.append('axis=' + str(self.q_per_channel_axis())) |
| if not custom_contents_provided: |
| tensor_str = _tensor_str(self.dequantize(), indent) |
| elif self.is_nested: |
| if not custom_contents_provided: |
| def indented_str(s, indent): |
| return "\n".join(f" {line}" for line in s.split("\n")) |
| strs = ",\n".join(indented_str(str(t), indent + 1) for t in torch.ops.aten.unbind.int(self, 0)) |
| tensor_str = f"[\n{strs}\n]" |
| elif torch._is_functional_tensor(self): |
| prefix = "_to_functional_tensor(" |
| tensor_str = repr(torch._from_functional_tensor(self)) |
| else: |
| if self.is_meta: |
| suffixes.append('size=' + str(tuple(self.shape))) |
| if self.dtype != torch.get_default_dtype(): |
| suffixes.append('dtype=' + str(self.dtype)) |
            # TODO: This implies that an ellipsis is valid syntax for allocating
            # a meta tensor, which it could be, but it isn't right now
| if not custom_contents_provided: |
| tensor_str = '...' |
| else: |
| if self.numel() == 0 and not self.is_sparse: |
| # Explicitly print the shape if it is not (0,), to match NumPy behavior |
| if self.dim() != 1: |
| suffixes.append('size=' + str(tuple(self.shape))) |
| |
| # In an empty tensor, there are no elements to infer if the dtype |
| # should be int64, so it must be shown explicitly. |
| if self.dtype != torch.get_default_dtype(): |
| suffixes.append('dtype=' + str(self.dtype)) |
| if not custom_contents_provided: |
| tensor_str = '[]' |
| else: |
| if not has_default_dtype: |
| suffixes.append('dtype=' + str(self.dtype)) |
| |
| if not custom_contents_provided: |
| if self.layout != torch.strided: |
| tensor_str = _tensor_str(self.to_dense(), indent) |
| else: |
| tensor_str = _tensor_str(self, indent) |
| |
| if self.layout != torch.strided: |
| suffixes.append('layout=' + str(self.layout)) |
| |
| # Use inp here to get the original grad_fn and not the one generated by the forward grad |
| # unpacking. |
| if inp.grad_fn is not None: |
| name = type(inp.grad_fn).__name__ |
| if name == 'CppFunction': |
| name = inp.grad_fn.name().rsplit('::', 1)[-1] |
| suffixes.append('grad_fn=<{}>'.format(name)) |
| elif inp.requires_grad: |
| suffixes.append('requires_grad=True') |
| |
| if self.has_names(): |
| suffixes.append('names={}'.format(self.names)) |
| |
| if tangent is not None: |
| suffixes.append('tangent={}'.format(tangent)) |
| |
| string_repr = _add_suffixes(prefix + tensor_str, suffixes, indent, force_newline=self.is_sparse) |
| |
| # Check if this instance is flagged as a parameter and change the repr accordingly. |
| # Unfortunately, this function has to be aware of this detail. |
| # NB: This is currently skipped for plain tensor parameters to maintain BC. In the future, |
| # this should be done for those as well to produce a valid repr. |
| if isinstance(self, torch.nn.Parameter) and not is_plain_tensor: |
| string_repr = f"Parameter({string_repr})" |
| |
| return string_repr |
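
# torch.Tensor.__repr__ delegates to _str (see torch/_tensor.py), so both
# repr(tensor) and print(tensor) are ultimately rendered by _str_intern above.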
| |
| def _str(self, *, tensor_contents=None): |
| with torch.no_grad(): |
| return _str_intern(self, tensor_contents=tensor_contents) |