Skip to content

Commit 461a66b

Browse files
native Query DSL format
1 parent 804108f commit 461a66b

File tree

2 files changed

+26
-12
lines changed

2 files changed

+26
-12
lines changed

README.rst

+10-2
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@ es2csv
44
A CLI tool for exporting data from Elasticsearch into a CSV file
55
----------------------------------------------------------------
66

7-
Command line utility, written in Python, for querying Elasticsearch in Lucene query syntax and for exporting documents into a CSV file. This tool can query bulk docs in multiple indices and get only selected fields, this reduces query execution time.
7+
Command line utility, written in Python, for querying Elasticsearch in Lucene query syntax or Query DSL syntax and exporting result as documents into a CSV file. This tool can query bulk docs in multiple indices and get only selected fields, this reduces query execution time.
88

99
Quick Look Demo
1010
---------------
@@ -31,7 +31,7 @@ Usage
3131
3232
$ es2csv [-h] -q QUERY [-u URL] [-i INDEX [INDEX ...]]
3333
[-t TAGS [TAGS ...]] -o FILE [-f FIELDS [FIELDS ...]]
34-
[-d DELIMITER] [-m INTEGER] [-k] [--debug]
34+
[-d DELIMITER] [-m INTEGER] [-k] [-r] [-v] [--debug]
3535
3636
Arguments:
3737
-q, --query QUERY Query string in Lucene syntax. [required]
@@ -43,6 +43,8 @@ Usage
4343
-d, --delimiter DELIMITER Delimiter to use in CSV file. Default is ",".
4444
-m, --max INTEGER Maximum number of results to return. Default is 0.
4545
-k, --kibana_nested Format nested fields in Kibana style.
46+
-r, --raw_query Switch query format in the Query DSL.
47+
-v, --version Show version and exit.
4648
--debug Debug mode on.
4749
-h, --help show this help message and exit
4850
@@ -53,6 +55,12 @@ Searching on localhost and save to database.csv
5355
.. code-block:: bash
5456
5557
$ es2csv -q 'host: localhost' -o database.csv
58+
59+
Same in Query DSL syntax
60+
61+
.. code-block:: bash
62+
63+
$ es2csv -r -q '{"query": {"match": {"host": "localhost"}}}' -o database.csv
5664
5765
With tag
5866

es2csv.py

+16-10
Original file line numberDiff line numberDiff line change
@@ -1,12 +1,14 @@
11
#!/usr/bin/env python
22
"""
33
title: A CLI tool for exporting data from Elasticsearch into a CSV file.
4-
description: Command line utility, written in Python, for querying Elasticsearch in Lucene query syntax and for exporting documents into a CSV file.
4+
description: Command line utility, written in Python, for querying Elasticsearch in Lucene query syntax or Query DSL syntax and exporting result as documents into a CSV file.
55
usage: es2csv -q '*' -i _all -o ~/file.csv -k -m 100
6+
es2csv -q '{"query": {"match_all": {}}}' -r -i _all -o ~/file.csv
67
es2csv -q '*' -i logstash-2015-01-* -f host status message -o ~/file.csv
78
es2csv -q 'host: localhost' -i logstash-2015-01-01 logstash-2015-01-02 -f host status message -o ~/file.csv
89
es2csv -q 'host: localhost AND status: GET' -u http://kibana.com:80/es/ -o ~/file.csv
910
es2csv -q '*' -t dev prod -u http://login:[email protected]:6666/es/ -o ~/file.csv
11+
es2csv -q '{"query": {"match_all": {}}, "filter":{"term": {"tags": "dev"}}}' -r -u http://login:[email protected]:6666/es/ -o ~/file.csv
1012
"""
1113
import os
1214
import sys
@@ -85,25 +87,28 @@ def check_indexes(self):
8587

8688
@retry(elasticsearch.exceptions.ConnectionError, tries=TIMES_TO_TRY)
8789
def search_query(self):
88-
query = self.opts.query if not self.opts.tags else '%s AND tags:%s' % (
89-
self.opts.query, '(%s)' % ' AND '.join(self.opts.tags))
90-
91-
if self.opts.debug_mode:
92-
print('Using these indices: %s' % ', '.join(self.opts.index_prefixes))
93-
print('Query: %s' % query)
94-
print('Output field(s): %s' % ', '.join(self.opts.fields))
95-
9690
search_args = dict(
9791
index=','.join(self.opts.index_prefixes),
98-
q=query,
9992
search_type='scan',
10093
scroll=self.scroll_time,
10194
size=self.scroll_size
10295
)
96+
if self.opts.raw_query:
97+
query = json.loads(self.opts.query)
98+
search_args['body'] = query
99+
else:
100+
query = self.opts.query if not self.opts.tags else '%s AND tags:%s' % (
101+
self.opts.query, '(%s)' % ' AND '.join(self.opts.tags))
102+
search_args['q'] = query
103103

104104
if '_all' not in self.opts.fields:
105105
search_args['fields'] = ','.join(self.opts.fields)
106106

107+
if self.opts.debug_mode:
108+
print('Using these indices: %s' % ', '.join(self.opts.index_prefixes))
109+
print('Query[%s]: %s' % (('Query DSL', json.dumps(query)) if self.opts.raw_query else ('Lucene', query)))
110+
print('Output field(s): %s' % ', '.join(self.opts.fields))
111+
107112
res = self.es_conn.search(**search_args)
108113

109114
self.scroll_ids.append(res['_scroll_id'])
@@ -236,6 +241,7 @@ def main():
236241
p.add_argument('-d', '--delimiter', dest='delimiter', default=',', type=str, help='Delimiter to use in CSV file. Default is "%(default)s".')
237242
p.add_argument('-m', '--max', dest='max_results', default=0, type=int, metavar='INTEGER', help='Maximum number of results to return. Default is %(default)s.')
238243
p.add_argument('-k', '--kibana_nested', dest='kibana_nested', action='store_true', help='Format nested fields in Kibana style.')
244+
p.add_argument('-r', '--raw_query', dest='raw_query', action='store_true', help='Switch query format in the Query DSL.')
239245
p.add_argument('-v', '--version', action='version', version='%(prog)s ' + __version__, help='Show version and exit.')
240246
p.add_argument('--debug', dest='debug_mode', action='store_true', help='Debug mode on.')
241247

0 commit comments

Comments
 (0)