Source code for cr.nimble._src.compression.run_length
# Copyright 2022 CR-Suite Development Team
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""
Run Length Encoding
References:
https://stackoverflow.com/questions/1066758/find-length-of-sequences-of-identical-values-in-a-numpy-array-run-length-encodi
"""
import numpy as np
[docs]def count_runs_values(input_arr):
"""Computes run lengths of an array of integers
"""
# make sure that input is a numpy array
input_arr = np.asarray(input_arr)
n = len(input_arr)
if n == 0:
return (np.empty(0),np.empty(0))
if n == 1:
return (np.ones(1), input_arr)
# locate the changes
changes = input_arr[1:] != input_arr[:-1]
changes, = np.where(changes)
# the last position should always be recorded as a change
changes = np.append(changes, n-1)
values = input_arr[changes]
changes = np.insert(changes, 0, -1)
# run lengths can be computed now
runs = np.diff(changes)
return runs, values
[docs]def expand_runs_values(runs, values):
"""Decodes run lengths to form an array of integers
"""
return np.concatenate(
[v * np.ones(r, dtype=np.int32)
for r, v in zip(runs, values)])