1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
|
from __future__ import print_function
import argparse
import datetime
import os
import subprocess
import sys
import tarfile
def extract_kindexes(kindexes):
    """Extract the ``.kzip`` members of each tar archive and yield their names.

    Every member whose name ends with ``.kzip`` is extracted with
    ``TarFile.extract`` using its default destination (the current working
    directory), and the member name is yielded right after extraction.

    Args:
        kindexes: iterable of paths to tar archives. Plain and compressed
            (gzip/bz2/xz) archives are both accepted.

    Yields:
        The archive-relative name of each extracted ``.kzip`` member.

    Raises:
        tarfile.ReadError: if a path is not a readable tar archive.
    """
    for kindex in kindexes:
        # tarfile.open() detects compression transparently; the bare TarFile
        # constructor can only read uncompressed archives.
        with tarfile.open(kindex) as tf:
            for fname in tf.getnames():
                if not fname.endswith('.kzip'):
                    continue
                tf.extract(fname)
                yield fname
def _run_stage(label, tool_name, cmd, input_data=None, stdout=subprocess.PIPE):
    """Run one pipeline command, log its wall-clock time and return its stdout.

    Args:
        label: stage name used in the ``[INFO] <label> execution time:`` log line.
        tool_name: tool name used in the failure message.
        cmd: argument list passed to ``subprocess.Popen``.
        input_data: bytes fed to the child's stdin; when ``None`` the child
            inherits the parent's stdin.
        stdout: where the child's stdout goes (``subprocess.PIPE`` or an open
            file object).

    Returns:
        The captured stdout when ``stdout`` is ``subprocess.PIPE``, else ``None``.

    Raises:
        Exception: if the command exits with a non-zero code.
    """
    stage_start = datetime.datetime.now()
    p = subprocess.Popen(
        cmd,
        stdin=subprocess.PIPE if input_data is not None else None,
        stdout=stdout,
    )
    out, _ = p.communicate(input_data)
    print(
        '[INFO] {} execution time:'.format(label),
        (datetime.datetime.now() - stage_start).total_seconds(),
        'seconds',
        file=sys.stderr,
    )
    if p.returncode:
        raise Exception('{} failed with exit code {}'.format(tool_name, p.returncode))
    return out


def just_do_it(java, kythe, kythe_to_proto, out_name, binding_only, kindexes):
    """Index the given kindex archives and preprocess the resulting entries.

    For each ``.kzip`` extracted from ``kindexes`` the function runs
    ``java_indexer.jar``, pipes its output through ``dedup_stream`` and then
    through ``entrystream --write_json``, appending the JSON to
    ``out_name + '.temp'``. After all inputs are processed, ``kythe_to_proto``
    is invoked once on that file to produce ``out_name``. The intermediate
    ``.temp`` file is not removed. Timing information is logged to stderr.

    Args:
        java: java executable used to launch the indexer jar.
        kythe: directory containing ``indexers/java_indexer.jar``,
            ``tools/dedup_stream`` and ``tools/entrystream``.
        kythe_to_proto: executable run with ``--preprocess-entry``.
        out_name: path passed to ``kythe_to_proto`` as ``--out``.
        binding_only: when true, ``--only-binding-data`` is added to the
            ``kythe_to_proto`` command line.
        kindexes: tar archive paths handed to ``extract_kindexes``.

    Raises:
        Exception: if the indexer, dedup_stream or entrystream exits non-zero.
        subprocess.CalledProcessError: if ``kythe_to_proto`` exits non-zero.
    """
    temp_out_name = out_name + '.temp'
    kindex_inputs = list(extract_kindexes(kindexes))
    # Create/truncate the intermediate file so each run starts from empty;
    # every kindex below appends to it.
    with open(temp_out_name, 'w'):
        pass
    start = datetime.datetime.now()
    for kindex in kindex_inputs:
        print('[INFO] Processing:', kindex, file=sys.stderr)
        indexer_out = _run_stage(
            'Indexer',
            'java_indexer',
            [java, '-jar', os.path.join(kythe, 'indexers/java_indexer.jar'), kindex],
        )
        dedup_out = _run_stage(
            'Dedup',
            'dedup_stream',
            [os.path.join(kythe, 'tools/dedup_stream')],
            input_data=indexer_out,
        )
        # Open the append target in a context manager so the handle is closed
        # after each kindex instead of leaking one descriptor per iteration.
        with open(temp_out_name, 'a') as entries_file:
            _run_stage(
                'Entrystream',
                'entrystream',
                [os.path.join(kythe, 'tools/entrystream'), '--write_json'],
                input_data=dedup_out,
                stdout=entries_file,
            )
    preprocess_start = datetime.datetime.now()
    subprocess.check_call(
        [kythe_to_proto, '--preprocess-entry', '--entries', temp_out_name, '--out', out_name]
        + (['--only-binding-data'] if binding_only else [])
    )
    print(
        '[INFO] Preprocessing execution time:',
        (datetime.datetime.now() - preprocess_start).total_seconds(),
        'seconds',
        file=sys.stderr,
    )
    print(
        '[INFO] Total execution time:',
        (datetime.datetime.now() - start).total_seconds(),
        'seconds',
        file=sys.stderr,
    )
if __name__ == '__main__':
    # Command-line entry point: collect tool locations and the list of kindex
    # archives, then hand everything to just_do_it().
    cli = argparse.ArgumentParser()
    for flag, description in (
        ("--java", "java path"),
        ("--kythe", "kythe path"),
        ("--kythe-to-proto", "kythe_to_proto tool path"),
        ("--out-name", "entries json out name"),
    ):
        cli.add_argument(flag, help=description)
    cli.add_argument(
        "--binding-only",
        action="store_true",
        default=False,
        help="filter only binding data",
    )
    # Zero or more positional kindex archive paths.
    cli.add_argument("kindexes", nargs='*')
    opts = cli.parse_args()
    just_do_it(
        java=opts.java,
        kythe=opts.kythe,
        kythe_to_proto=opts.kythe_to_proto,
        out_name=opts.out_name,
        binding_only=opts.binding_only,
        kindexes=opts.kindexes,
    )
|