import logging
import struct
import numpy as np
from pylas import extradims
from pylas.vlrs.known import ExtraBytesStruct, ExtraBytesVlr
from .. import errors
from ..compression import (
uncompressed_id_to_compressed,
lazperf_compress_points,
lazrs_compress_points,
LasZipProcess
)
from ..point import record, dims, PointFormat
from ..utils import ConveyorThread
from ..vlrs import known, vlrlist
logger = logging.getLogger(__name__)
[docs]def scale_dimension(array_dim, scale, offset):
return (array_dim * scale) + offset
[docs]def unscale_dimension(array_dim, scale, offset):
return np.round((np.array(array_dim) - offset) / scale)
[docs]def is_in_bounds_of_type(array, type_info):
return array.max() < type_info.max and array.min() > type_info.min
OVERFLOW_ERR_MSG = "Values given for '{}' won't fit in an {} array, with the current scale ({})"
[docs]class LasBase(object):
""" LasBase is the base of all the different LasData classes.
These classes are objects that the user will interact with to manipulate las data.
It connects the point record, header, vlrs together.
To access points dimensions using this class you have two possibilities
.. code:: python
las = pylas.read('some_file.las')
las.classification
# or
las['classification']
.. note::
using las['dimension_name'] is not possible with the scaled values of x, y, z
"""
def __init__(self, *, header, vlrs=None, points=None):
if points is None:
points = record.PackedPointRecord.empty(PointFormat(header.point_format_id))
self.__dict__["points_data"] = points
self.header = header
self.vlrs = vlrs if vlrs is not None else vlrlist.VLRList()
@property
def x(self):
""" Returns the scaled x positions of the points as doubles
"""
return scale_dimension(self.X, self.header.x_scale, self.header.x_offset)
@property
def y(self):
""" Returns the scaled y positions of the points as doubles
"""
return scale_dimension(self.Y, self.header.y_scale, self.header.y_offset)
@property
def z(self):
""" Returns the scaled z positions of the points as doubles
"""
return scale_dimension(self.Z, self.header.z_scale, self.header.z_offset)
@x.setter
def x(self, value):
if self.header.x_offset == 0.0:
self.header.x_offset = np.min(value)
X = unscale_dimension(value, self.header.x_scale, self.header.x_offset)
dim_info = self.point_format.dimension_type_info('X')
if not is_in_bounds_of_type(X, dim_info):
raise OverflowError(OVERFLOW_ERR_MSG.format('x', dim_info.dtype, self.header.x_scale))
self.X = X
@y.setter
def y(self, value):
if self.header.y_offset == 0.0:
self.header.y_offset = np.min(value)
Y = unscale_dimension(value, self.header.y_scale, self.header.y_offset)
dim_info = self.point_format.dimension_type_info('Y')
if not is_in_bounds_of_type(Y, dim_info):
raise OverflowError(OVERFLOW_ERR_MSG.format('y', dim_info.dtype, self.header.y_scale))
self.Y = Y
@z.setter
def z(self, value):
if self.header.z_offset == 0.0:
self.header.z_offset = np.min(value)
Z = unscale_dimension(value, self.header.z_scale, self.header.z_offset)
dim_info = self.point_format.dimension_type_info('Z')
if not is_in_bounds_of_type(Z, dim_info):
raise OverflowError(OVERFLOW_ERR_MSG.format('z', dim_info.dtype, self.header.z_scale))
self.Z = Z
@property
def point_format(self):
return self.points_data.point_format
@property
def points(self):
""" returns the numpy array representing the points
Returns
-------
the Numpy structured array of points
"""
return self.points_data.array
@points.setter
def points(self, value):
""" Setter for the points property,
Takes care of changing the point_format of the file
(as long as the point format of the new points it compatible with the file version)
Parameters
----------
value: numpy.array of the new points
"""
if value.dtype != self.points.dtype:
raise errors.IncompatibleDataFormat('Cannot set points with a different point format, convert first')
new_point_record = record.PackedPointRecord(value, self.points_data.point_format)
dims.raise_if_version_not_compatible_with_fmt(
new_point_record.point_format.id, self.header.version
)
self.points_data = new_point_record
self.update_header()
def __getattr__(self, item):
""" Automatically called by Python when the attribute
named 'item' is no found. We use this function to forward the call the
point record. This is the mechanism used to allow the users to access
the points dimensions directly through a LasData.
Parameters
----------
item: str
name of the attribute, should be a dimension name
Returns
-------
The requested dimension if it exists
"""
return self.points_data[item]
def __setattr__(self, key, value):
""" This is called on every access to an attribute of the instance.
Again we use this to forward the call the the points record
But this time checking if the key is actually a dimension name
so that an error is raised if the user tries to set a valid
LAS dimension even if it is not present in the field.
eg: user tries to set the red field of a file with point format 0:
an error is raised
"""
if key in dims.DIMENSIONS or key in self.points_data.all_dimensions_names:
self.points_data[key] = value
else:
super().__setattr__(key, value)
def __getitem__(self, item):
return self.points_data[item]
def __setitem__(self, key, value):
self.points_data[key] = value
[docs] def write_to(self, out_stream, do_compress=False):
""" writes the data to a stream
Parameters
----------
out_stream: file object
the destination stream, implementing the write method
do_compress: bool, optional, default False
Flag to indicate if you want the date to be compressed
"""
self.update_header()
if (
self.vlrs.get("ExtraBytesVlr")
and not self.points_data.extra_dimensions_names
):
logger.error(
"Las contains an ExtraBytesVlr, but no extra bytes were found in the point_record, "
"removing the vlr"
)
self.vlrs.extract("ExtraBytesVlr")
if do_compress:
try:
compressed_points_buf, vlr_data = lazrs_compress_points(self.points_data)
except errors.LazError as e:
try:
logger.error("pylaz failed to compress: {}".format(e))
compressed_points_buf, vlr_data = lazperf_compress_points(self.points_data)
except errors.LazError as e:
logger.error("lazperf failed to compress: {}".format(e))
self._compress_with_laszip_executable(out_stream)
return
self.vlrs.append(known.LasZipVlr(vlr_data))
raw_vlrs = vlrlist.RawVLRList.from_list(self.vlrs)
self.header.offset_to_point_data = (
self.header.size + raw_vlrs.total_size_in_bytes()
)
self.header.point_format_id = uncompressed_id_to_compressed(
self.header.point_format_id
)
self.header.number_of_vlr = len(raw_vlrs)
# Update Chunk table offset from being from the start of point data
# to the start of the file
points_bytes = bytearray(compressed_points_buf.tobytes())
offset_to_chunk_table = struct.unpack_from("<q", points_bytes, 0)[0]
struct.pack_into("<q", points_bytes, 0, self.header.offset_to_point_data + offset_to_chunk_table)
else:
raw_vlrs = vlrlist.RawVLRList.from_list(self.vlrs)
self.header.number_of_vlr = len(raw_vlrs)
self.header.offset_to_point_data = (
self.header.size + raw_vlrs.total_size_in_bytes()
)
points_bytes = self.points_data.memoryview()
self.header.write_to(out_stream)
self._raise_if_not_expected_pos(out_stream, self.header.size)
raw_vlrs.write_to(out_stream)
self._raise_if_not_expected_pos(out_stream, self.header.offset_to_point_data)
out_stream.write(points_bytes)
@staticmethod
def _raise_if_not_expected_pos(stream, expected_pos):
if not stream.tell() == expected_pos:
raise RuntimeError(
"Writing, expected to be at pos {} but stream is at pos {}".format(
expected_pos, stream.tell()
)
)
[docs] def write_to_file(self, filename, do_compress=None):
""" Writes the las data into a file
Parameters
----------
filename : str
The file where the data should be written.
do_compress: bool, optional, default None
if None the extension of the filename will be used
to determine if the data should be compressed
otherwise the do_compress flag indicate if the data should be compressed
"""
is_ext_laz = filename.split(".")[-1] == "laz"
if is_ext_laz and do_compress is None:
do_compress = True
with open(filename, mode="wb") as out:
self.write_to(out, do_compress=do_compress)
[docs] def write(self, destination, do_compress=None):
""" Writes to a stream or file
When destination is a string, it will be interpreted as the path were the file should be written to,
also if do_compress is None, the compression will be guessed from the file extension:
- .laz -> compressed
- .las -> uncompressed
.. note::
This means that you could do something like:
# Create .laz but not compressed
las.write('out.laz', do_compress=False)
# Create .las but compressed
las.write('out.las', do_compress=True)
While it should not confuse Las/Laz readers, it will confuse humans so avoid doing it
Parameters
----------
destination: str or file object
filename or stream to write to
do_compress: bool, optional
Flags to indicate if you want to compress the data
"""
if isinstance(destination, str):
self.write_to_file(destination)
else:
if do_compress is None:
do_compress = False
self.write_to(destination, do_compress=do_compress)
def _compress_with_laszip_executable(self, out_stream):
try:
out_stream.fileno()
except OSError:
laszip_prc = LasZipProcess(LasZipProcess.Actions.Compress)
out_stream.seek(0)
t = ConveyorThread(laszip_prc.stdout, out_stream)
t.start()
self.write_to(laszip_prc.stdin, do_compress=False)
laszip_prc.stdin.close()
t.join()
laszip_prc.wait()
laszip_prc.raise_if_bad_err_code()
else:
# The ouput is a file
# let laszip write directly to it, to avoid copies
laszip_prc = LasZipProcess(LasZipProcess.Actions.Compress, stdout=out_stream)
self.write_to(laszip_prc.stdin)
laszip_prc.wait_until_finished()
def __repr__(self):
return "<LasData({}.{}, point fmt: {}, {} points, {} vlrs)>".format(
self.header.version_major,
self.header.version_minor,
self.points_data.point_format,
len(self.points_data),
len(self.vlrs),
)