diff options
author | Ian Kasprzak <iankaz@google.com> | 2020-12-23 10:08:20 -0800 |
---|---|---|
committer | Ian Kasprzak <iankaz@google.com> | 2021-01-06 17:49:41 +0000 |
commit | 30bc354e25cb5ccfbbb276a93ec54195e6b966a4 (patch) | |
tree | bf4e82ca88ade5a57b2fb1e46a6a8991c84f7b98 /git_trace2_event_log.py | |
parent | ce9b6c43b2394f3f8c9413abfa3a10597de54223 (diff) | |
download | git-repo-30bc354e25cb5ccfbbb276a93ec54195e6b966a4.tar.gz |
Enable git trace2 event format logging.
Ways to enable logging:
1) Set git's trace2.eventtarget config variable to desired logging path
2) Specify path via --git_trace2_event_log option
A unique logfile name is generated per repo execution (based on the repo session-id).
Testing:
1) Verified git config 'trace2.eventtarget' and flag enable logging.
2) Verified version/start/exit events are in the expected format:
https://git-scm.com/docs/api-trace2#_event_format
3) Unit tests
Bug: https://crbug.com/gerrit/13706
Change-Id: I335eba68124055321c4149979bec36ac16ef81eb
Tested-by: Ian Kasprzak <iankaz@google.com>
Reviewed-on: https://gerrit-review.googlesource.com/c/git-repo/+/292262
Reviewed-by: Mike Frysinger <vapier@google.com>
Reviewed-by: Jonathan Nieder <jrn@google.com>
Diffstat (limited to 'git_trace2_event_log.py')
-rw-r--r-- | git_trace2_event_log.py | 197 |
1 files changed, 197 insertions, 0 deletions
diff --git a/git_trace2_event_log.py b/git_trace2_event_log.py new file mode 100644 index 00000000..4a8e0347 --- /dev/null +++ b/git_trace2_event_log.py | |||
@@ -0,0 +1,197 @@ | |||
1 | # Copyright (C) 2020 The Android Open Source Project | ||
2 | # | ||
3 | # Licensed under the Apache License, Version 2.0 (the "License"); | ||
4 | # you may not use this file except in compliance with the License. | ||
5 | # You may obtain a copy of the License at | ||
6 | # | ||
7 | # http://www.apache.org/licenses/LICENSE-2.0 | ||
8 | # | ||
9 | # Unless required by applicable law or agreed to in writing, software | ||
10 | # distributed under the License is distributed on an "AS IS" BASIS, | ||
11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
12 | # See the License for the specific language governing permissions and | ||
13 | # limitations under the License. | ||
14 | |||
15 | """Provide event logging in the git trace2 EVENT format. | ||
16 | |||
17 | The git trace2 EVENT format is defined at: | ||
18 | https://www.kernel.org/pub/software/scm/git/docs/technical/api-trace2.html#_event_format | ||
19 | https://git-scm.com/docs/api-trace2#_the_event_format_target | ||
20 | |||
21 | Usage: | ||
22 | |||
23 | git_trace_log = EventLog() | ||
24 | git_trace_log.StartEvent() | ||
25 | ... | ||
26 | git_trace_log.ExitEvent(result) | |
27 | git_trace_log.Write() | ||
28 | """ | ||
29 | |||
30 | |||
31 | import datetime | ||
32 | import json | ||
33 | import os | ||
34 | import sys | ||
35 | import tempfile | ||
36 | import threading | ||
37 | |||
38 | from git_command import GitCommand, RepoSourceVersion | ||
39 | |||
40 | |||
class EventLog(object):
    """Event log that records events that occurred during a repo invocation.

    Events are written to the log as consecutive JSON entries, one per line.
    Entries follow the git trace2 EVENT format.

    Each entry contains the following common keys:
    - event: The event name
    - sid: session-id - Unique string to allow process instance to be identified.
    - thread: The thread name.
    - time: The UTC time of the event.

    Valid 'event' names and event specific fields are documented here:
    https://git-scm.com/docs/api-trace2#_event_format
    """

    def __init__(self, env=None):
        """Initializes the event log.

        Args:
          env: Mapping used to read the parent session-id from, and to publish
              the full session-id to, under the 'GIT_TRACE2_PARENT_SID' key.
              Defaults to os.environ.
        """
        self._log = []
        # Try to get session-id (sid) from environment (setup in repo launcher).
        KEY = 'GIT_TRACE2_PARENT_SID'
        if env is None:
            env = os.environ

        now = self._UtcNow()

        # Save both our sid component and the complete sid.
        # We use our sid component (self._sid) as the unique filename prefix and
        # the full sid (self._full_sid) in the log itself.
        self._sid = 'repo-%s-P%08x' % (now.strftime('%Y%m%dT%H%M%SZ'),
                                       os.getpid())
        parent_sid = env.get(KEY)
        # Append our sid component to the parent sid (if it exists).
        if parent_sid is not None:
            self._full_sid = parent_sid + '/' + self._sid
        else:
            self._full_sid = self._sid

        # Set/update the environment variable.
        # Environment handling across systems is messy.
        try:
            env[KEY] = self._full_sid
        except UnicodeEncodeError:
            env[KEY] = self._full_sid.encode()

        # Add a version event to front of the log.
        self._AddVersionEvent()

    @property
    def full_sid(self):
        """The complete session-id (parent sid, if any, plus our component)."""
        return self._full_sid

    @staticmethod
    def _UtcNow():
        """Returns the current UTC time as a naive datetime."""
        # datetime.utcnow() is deprecated. The tzinfo is dropped so that
        # isoformat() does not append '+00:00' in front of the 'Z' suffix.
        return datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None)

    def _AddVersionEvent(self):
        """Adds a 'version' event at the beginning of current log."""
        version_event = self._CreateEventDict('version')
        version_event['evt'] = 2
        version_event['exe'] = RepoSourceVersion()
        self._log.insert(0, version_event)

    def _CreateEventDict(self, event_name):
        """Returns a dictionary with the common keys/values for git trace2 events.

        Args:
          event_name: The event name.

        Returns:
          Dictionary with the common event fields populated.
        """
        return {
            'event': event_name,
            'sid': self._full_sid,
            'thread': threading.current_thread().name,
            'time': self._UtcNow().isoformat() + 'Z',
        }

    def StartEvent(self):
        """Append a 'start' event to the current log."""
        start_event = self._CreateEventDict('start')
        # Snapshot argv so later mutation of sys.argv cannot alter the event.
        start_event['argv'] = list(sys.argv)
        self._log.append(start_event)

    def ExitEvent(self, result):
        """Append an 'exit' event to the current log.

        Args:
          result: Exit code of the event
        """
        exit_event = self._CreateEventDict('exit')

        # Consider 'None' success (consistent with event_log result handling).
        if result is None:
            result = 0
        exit_event['code'] = result
        self._log.append(exit_event)

    def _GetEventTargetPath(self):
        """Looks up the log target from git's 'trace2.eventtarget' config.

        Returns:
          The configured value with trailing newlines stripped, or None if the
          variable is not set or the 'git config' call failed.
        """
        cmd = ['config', '--get', 'trace2.eventtarget']
        # TODO(https://crbug.com/gerrit/13706): Use GitConfig when it supports
        # system git config variables.
        p = GitCommand(None, cmd, capture_stdout=True, capture_stderr=True,
                       bare=True)
        retval = p.Wait()
        if retval == 0:
            # Strip the trailing newline from the command output.
            return p.stdout.rstrip('\n')
        if retval != 1:
            # `git config --get` is documented to produce an exit status of `1`
            # if the requested variable is not present in the configuration.
            # Report any other return value as an error.
            print("repo: error: 'git config --get' call failed with return code: %r, stderr: %r" % (
                retval, p.stderr), file=sys.stderr)
        return None

    def Write(self, path=None):
        """Writes the log out to a file.

        Log is only written if 'path' or 'git config --get trace2.eventtarget'
        provide a valid path to write logs to.

        Logging filename format follows the git trace2 style of being a unique
        (exclusive writable) file.

        Args:
          path: Path to where logs should be written.

        Returns:
          log_path: Path to the log file if log is written, otherwise None

        Raises:
          TypeError: If an explicit 'path' is given that is not a str.
        """
        # If no logging path is specified, get the path from
        # 'trace2.eventtarget'.
        if path is None:
            path = self._GetEventTargetPath()

        # Neither an explicit path nor a configured target: logging is simply
        # disabled, which is not an error.
        if path is None:
            return None

        if not isinstance(path, str):
            raise TypeError('path: str required but got %s.' % type(path))

        # Get absolute path.
        path = os.path.abspath(os.path.expanduser(path))

        # Only directory targets are handled here.
        # TODO(https://crbug.com/gerrit/13706): Support file (append) mode also.
        if not os.path.isdir(path):
            return None

        # Use NamedTemporaryFile to generate a unique filename as required by
        # git trace2.
        try:
            with tempfile.NamedTemporaryFile(mode='x', prefix=self._sid,
                                             dir=path, delete=False) as f:
                # TODO(https://crbug.com/gerrit/13706): Support writing events
                # as they occur.
                for e in self._log:
                    # Dump in compact encoding mode.
                    # See 'Compact encoding' in Python docs:
                    # https://docs.python.org/3/library/json.html#module-json
                    json.dump(e, f, indent=None, separators=(',', ':'))
                    f.write('\n')
                log_path = f.name
        except FileExistsError as err:
            print('repo: warning: git trace2 logging failed: %r' % err,
                  file=sys.stderr)
            return None
        return log_path