eris- Elasticsearch Recon Ingestion Scripts (ERIS) 🔎 |
git clone git://git.acid.vegas/-c.git |
Log | Files | Refs | Archive | README | LICENSE |
commit a53541c32816b101de86b53faeda96f2799ba82e
parent 78d7556f09284219f77fe28ffa7e401d61a5a09b Author: acidvegas <acid.vegas@acid.vegas> Date: Sat, 23 Mar 2024 14:31:39 -0400 Added zone field too better querying on specific tlds/zones Diffstat:
|
1 file changed, 5 insertions(+), 0 deletions(-) |
diff --git a/ingestors/ingest_zone.py b/ingestors/ingest_zone.py @@ -29,6 +29,7 @@ def construct_map() -> dict: 'mappings': { 'properties': { 'domain' : keyword_mapping, + 'zone' : { 'type': 'keyword' }, 'records' : { 'type': 'nested', 'properties': {} }, 'source' : { 'type': 'keyword' }, 'seen' : { 'type': 'date' } @@ -62,6 +63,9 @@ async def process_data(file_path: str): # Initialize the cache last = None + # Determine the zone name from the file path (e.g., /path/to/zones/com.eu.txt -> com.eu zone) + zone = '.'.join(file_path.split('/')[-1].split('.')[:-1]) + # Read the input file line by line async for line in input_file: line = line.strip() @@ -129,6 +133,7 @@ async def process_data(file_path: str): '_index' : default_index, '_doc' : { 'domain' : domain, + 'zone' : zone, 'records' : {record_type: [{'data': data, 'ttl': ttl}]}, 'source' : 'czds', 'seen' : time.strftime('%Y-%m-%dT%H:%M:%SZ', time.gmtime()) # Zone files do not contain a timestamp, so we use the current time |