Skip to main content

LZMA

Supported formats

LZMA, Lzip (LZMA), XZ (LZMA2)

Description

LZMA (Lempel-Ziv-Markov chain algorithm) and LZMA2 are data compression algorithms widely known for their high compression ratio and are commonly used in file compression formats. This backend handles LZMA, Lzip and XZ streams; 7z archives are handled by a separate, dedicated backend.

info

Available in Contextal Platform 1.0 and later.

Symbols

Object

  • LIMITS_REACHED → limits were reached while processing the stream

Children

  • TOOBIG → the stream was not extracted because it exceeds the configured limits

Example Metadata

{
"org": "ctx",
"object_id": "964a9c008693dda26b751104fdc88abd18c2ea8f3d5023d5096567ecf04e5f61",
"object_type": "LZMA",
"object_subtype": "XZ",
"recursion_level": 1,
"size": 1656,
"hashes": {
"sha256": "964a9c008693dda26b751104fdc88abd18c2ea8f3d5023d5096567ecf04e5f61",
"sha1": "c206dd9a0df656a1e8af55a9d3cea387e80cc166",
"sha512": "b89341affa54d8d1908f74f84593c862c91c727c677706a80b599d5b9d3e73c530c951b772bde5b6df2529ee128a53548739c50095c6b200ad787fc4da25fc34",
"md5": "531295b352c13cf931d3d8939edac77c"
},
"ctime": 1727280188.640392,
"ok": {
"symbols": [],
"object_metadata": {
"_backend_version": "1.0.0"
},
"children": [
{
"org": "ctx",
"object_id": "c26af93f9d4c468a7b00a6798dde9f80ffb95e090f5a06b4d321bc920e92706a",
"object_type": "Text",
"object_subtype": null,
"recursion_level": 2,
"size": 3614,
"hashes": {
"sha256": "c26af93f9d4c468a7b00a6798dde9f80ffb95e090f5a06b4d321bc920e92706a",
"sha512": "6dcda22e7ff2570fe6d86c4b98aa8230a0c42b91a70161fbd53c11f97dd7fddc64c258b7ab0c540b6d9cf877a682eb01f0e41fe8240d368b78a8c49ca2c6d2f1",
"sha1": "11b688f562b72e65a5484a96bca2e02a68bfc9b4",
"md5": "68a5a022852aedce26106da8b4212455"
},
"ctime": 1727280188.640392,
"relation_metadata": {
"compression_factor": 2.1823671497584543,
"input_size": 1656,
"name": "data.txt",
"output_size": 3614
},
"ok": {
"symbols": [
"ALL_ASCII",
"CC_NUMBER",
"MANY_NUMBERS"
],
"object_metadata": {
"_backend_version": "1.0.0",
"encoding": "utf-8",
"natural_language": "English",
"natural_language_profanity_count": 0,
"natural_language_sentiment": {
"compound": 0.0772283284276542,
"neg": 0,
"neu": 0.993444276348966,
"pos": 0.006555723651033787
},
"number_of_ascii_range_chars": 3614,
"number_of_characters": 3614,
"number_of_digits": 400,
"number_of_newlines": 162,
"number_of_whitespaces": 208,
"number_of_words": 206,
"possible_passwords": [],
"uris": []
},
"children": []
}
}
]
}
}

Example Queries

object_type == "LZMA"
&& @has_child(object_type == "Text"
&& @has_symbol("CC_NUMBER")
)
  • This query matches an LZMA object, from which a Text object with possible credit card number(s) was extracted.

Configuration Options

  • max_child_input_size → maximum input (compressed) size of a child object (default: 262144000)
  • max_child_output_size → maximum output (decompressed) size of a child object (default: 262144000)