Ninja
deps_log.cc
Go to the documentation of this file.
1 // Copyright 2012 Google Inc. All Rights Reserved.
2 //
3 // Licensed under the Apache License, Version 2.0 (the "License");
4 // you may not use this file except in compliance with the License.
5 // You may obtain a copy of the License at
6 //
7 // http://www.apache.org/licenses/LICENSE-2.0
8 //
9 // Unless required by applicable law or agreed to in writing, software
10 // distributed under the License is distributed on an "AS IS" BASIS,
11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 // See the License for the specific language governing permissions and
13 // limitations under the License.
14 
15 #include "deps_log.h"
16 
17 #include <assert.h>
18 #include <stdio.h>
19 #include <errno.h>
20 #include <string.h>
21 #ifndef _WIN32
22 #include <unistd.h>
23 #endif
24 
25 #include "graph.h"
26 #include "metrics.h"
27 #include "state.h"
28 #include "util.h"
29 
// On-disk header layout: the text signature below (12 bytes, no trailing NUL)
// followed by the format version as a 4-byte integer, 16 bytes in total.
// Because the version is written in native byte order, it doubles as a byte
// order mark.
const char kFileSignature[] = "# ninjadeps\n";
const int kCurrentVersion = 1;
34 
36  Close();
37 }
38 
39 bool DepsLog::OpenForWrite(const string& path, string* err) {
40  if (needs_recompaction_) {
41  Close();
42  if (!Recompact(path, err))
43  return false;
44  }
45 
46  file_ = fopen(path.c_str(), "ab");
47  if (!file_) {
48  *err = strerror(errno);
49  return false;
50  }
51  SetCloseOnExec(fileno(file_));
52 
53  // Opening a file in append mode doesn't set the file pointer to the file's
54  // end on Windows. Do that explicitly.
55  fseek(file_, 0, SEEK_END);
56 
57  if (ftell(file_) == 0) {
58  if (fwrite(kFileSignature, sizeof(kFileSignature) - 1, 1, file_) < 1) {
59  *err = strerror(errno);
60  return false;
61  }
62  if (fwrite(&kCurrentVersion, 4, 1, file_) < 1) {
63  *err = strerror(errno);
64  return false;
65  }
66  }
67 
68  return true;
69 }
70 
72  const vector<Node*>& nodes) {
73  return RecordDeps(node, mtime, nodes.size(),
74  nodes.empty() ? NULL : (Node**)&nodes.front());
75 }
76 
78  int node_count, Node** nodes) {
79  // Track whether there's any new data to be recorded.
80  bool made_change = false;
81 
82  // Assign ids to all nodes that are missing one.
83  if (node->id() < 0) {
84  RecordId(node);
85  made_change = true;
86  }
87  for (int i = 0; i < node_count; ++i) {
88  if (nodes[i]->id() < 0) {
89  RecordId(nodes[i]);
90  made_change = true;
91  }
92  }
93 
94  // See if the new data is different than the existing data, if any.
95  if (!made_change) {
96  Deps* deps = GetDeps(node);
97  if (!deps ||
98  deps->mtime != mtime ||
99  deps->node_count != node_count) {
100  made_change = true;
101  } else {
102  for (int i = 0; i < node_count; ++i) {
103  if (deps->nodes[i] != nodes[i]) {
104  made_change = true;
105  break;
106  }
107  }
108  }
109  }
110 
111  // Don't write anything if there's no new info.
112  if (!made_change)
113  return true;
114 
115  // Update on-disk representation.
116  uint16_t size = 4 * (1 + 1 + (uint16_t)node_count);
117  size |= 0x8000; // Deps record: set high bit.
118  fwrite(&size, 2, 1, file_);
119  int id = node->id();
120  fwrite(&id, 4, 1, file_);
121  int timestamp = mtime;
122  fwrite(&timestamp, 4, 1, file_);
123  for (int i = 0; i < node_count; ++i) {
124  id = nodes[i]->id();
125  fwrite(&id, 4, 1, file_);
126  }
127 
128  // Update in-memory representation.
129  Deps* deps = new Deps(mtime, node_count);
130  for (int i = 0; i < node_count; ++i)
131  deps->nodes[i] = nodes[i];
132  UpdateDeps(node->id(), deps);
133 
134  return true;
135 }
136 
138  if (file_)
139  fclose(file_);
140  file_ = NULL;
141 }
142 
143 bool DepsLog::Load(const string& path, State* state, string* err) {
144  METRIC_RECORD(".ninja_deps load");
145  char buf[32 << 10];
146  FILE* f = fopen(path.c_str(), "rb");
147  if (!f) {
148  if (errno == ENOENT)
149  return true;
150  *err = strerror(errno);
151  return false;
152  }
153 
154  bool valid_header = true;
155  int version = 0;
156  if (!fgets(buf, sizeof(buf), f) || fread(&version, 4, 1, f) < 1)
157  valid_header = false;
158  if (!valid_header || strcmp(buf, kFileSignature) != 0 ||
159  version != kCurrentVersion) {
160  *err = "bad deps log signature or version; starting over";
161  fclose(f);
162  unlink(path.c_str());
163  // Don't report this as a failure. An empty deps log will cause
164  // us to rebuild the outputs anyway.
165  return true;
166  }
167 
168  long offset;
169  bool read_failed = false;
170  int unique_dep_record_count = 0;
171  int total_dep_record_count = 0;
172  for (;;) {
173  offset = ftell(f);
174 
175  uint16_t size;
176  if (fread(&size, 2, 1, f) < 1) {
177  if (!feof(f))
178  read_failed = true;
179  break;
180  }
181  bool is_deps = (size >> 15) != 0;
182  size = size & 0x7FFF;
183 
184  if (fread(buf, size, 1, f) < 1) {
185  read_failed = true;
186  break;
187  }
188 
189  if (is_deps) {
190  assert(size % 4 == 0);
191  int* deps_data = reinterpret_cast<int*>(buf);
192  int out_id = deps_data[0];
193  int mtime = deps_data[1];
194  deps_data += 2;
195  int deps_count = (size / 4) - 2;
196 
197  Deps* deps = new Deps(mtime, deps_count);
198  for (int i = 0; i < deps_count; ++i) {
199  assert(deps_data[i] < (int)nodes_.size());
200  assert(nodes_[deps_data[i]]);
201  deps->nodes[i] = nodes_[deps_data[i]];
202  }
203 
204  total_dep_record_count++;
205  if (!UpdateDeps(out_id, deps))
206  ++unique_dep_record_count;
207  } else {
208  StringPiece path(buf, size);
209  Node* node = state->GetNode(path);
210  assert(node->id() < 0);
211  node->set_id(nodes_.size());
212  nodes_.push_back(node);
213  }
214  }
215 
216  if (read_failed) {
217  // An error occurred while loading; try to recover by truncating the
218  // file to the last fully-read record.
219  if (ferror(f)) {
220  *err = strerror(ferror(f));
221  } else {
222  *err = "premature end of file";
223  }
224  fclose(f);
225 
226  if (!Truncate(path.c_str(), offset, err))
227  return false;
228 
229  // The truncate succeeded; we'll just report the load error as a
230  // warning because the build can proceed.
231  *err += "; recovering";
232  return true;
233  }
234 
235  fclose(f);
236 
237  // Rebuild the log if there are too many dead records.
238  int kMinCompactionEntryCount = 1000;
239  int kCompactionRatio = 3;
240  if (total_dep_record_count > kMinCompactionEntryCount &&
241  total_dep_record_count > unique_dep_record_count * kCompactionRatio) {
242  needs_recompaction_ = true;
243  }
244 
245  return true;
246 }
247 
249  // Abort if the node has no id (never referenced in the deps) or if
250  // there's no deps recorded for the node.
251  if (node->id() < 0 || node->id() >= (int)deps_.size())
252  return NULL;
253  return deps_[node->id()];
254 }
255 
256 bool DepsLog::Recompact(const string& path, string* err) {
257  METRIC_RECORD(".ninja_deps recompact");
258  printf("Recompacting deps...\n");
259 
260  string temp_path = path + ".recompact";
261 
262  // OpenForWrite() opens for append. Make sure it's not appending to a
263  // left-over file from a previous recompaction attempt that crashed somehow.
264  unlink(temp_path.c_str());
265 
266  DepsLog new_log;
267  if (!new_log.OpenForWrite(temp_path, err))
268  return false;
269 
270  // Clear all known ids so that new ones can be reassigned. The new indices
271  // will refer to the ordering in new_log, not in the current log.
272  for (vector<Node*>::iterator i = nodes_.begin(); i != nodes_.end(); ++i)
273  (*i)->set_id(-1);
274 
275  // Write out all deps again.
276  for (int old_id = 0; old_id < (int)deps_.size(); ++old_id) {
277  Deps* deps = deps_[old_id];
278  if (!deps) continue; // If nodes_[old_id] is a leaf, it has no deps.
279 
280  if (!new_log.RecordDeps(nodes_[old_id], deps->mtime,
281  deps->node_count, deps->nodes)) {
282  new_log.Close();
283  return false;
284  }
285  }
286 
287  new_log.Close();
288 
289  // All nodes now have ids that refer to new_log, so steal its data.
290  deps_.swap(new_log.deps_);
291  nodes_.swap(new_log.nodes_);
292 
293  if (unlink(path.c_str()) < 0) {
294  *err = strerror(errno);
295  return false;
296  }
297 
298  if (rename(temp_path.c_str(), path.c_str()) < 0) {
299  *err = strerror(errno);
300  return false;
301  }
302 
303  return true;
304 }
305 
306 bool DepsLog::UpdateDeps(int out_id, Deps* deps) {
307  if (out_id >= (int)deps_.size())
308  deps_.resize(out_id + 1);
309 
310  bool delete_old = deps_[out_id] != NULL;
311  if (delete_old)
312  delete deps_[out_id];
313  deps_[out_id] = deps;
314  return delete_old;
315 }
316 
317 bool DepsLog::RecordId(Node* node) {
318  uint16_t size = (uint16_t)node->path().size();
319  fwrite(&size, 2, 1, file_);
320  fwrite(node->path().data(), node->path().size(), 1, file_);
321 
322  node->set_id(nodes_.size());
323  nodes_.push_back(node);
324 
325  return true;
326 }
const int kCurrentVersion
Definition: deps_log.cc:33
const char kFileSignature[]
Definition: deps_log.cc:32
vector< Deps * > deps_
Maps id -> deps of that id.
Definition: deps_log.h:105
Node * GetNode(StringPiece path)
Definition: state.cc:112
StringPiece represents a slice of a string whose memory is managed externally.
Definition: string_piece.h:27
Information about a node in the dependency graph: the file, whether it's dirty, mtime, etc.
Definition: graph.h:35
Node ** nodes
Definition: deps_log.h:80
int TimeStamp
Definition: timestamp.h:22
void SetCloseOnExec(int fd)
Mark a file descriptor to not be inherited on exec()s.
Definition: util.cc:200
As build commands run they can output extra dependency information (e.g. header dependencies for C source) dynamically.
Definition: deps_log.h:63
vector< Node * > nodes_
Maps id -> Node.
Definition: deps_log.h:103
bool OpenForWrite(const string &path, string *err)
Definition: deps_log.cc:39
void set_id(int id)
Definition: graph.h:84
Deps * GetDeps(Node *node)
Definition: deps_log.cc:248
int node_count
Definition: deps_log.h:79
bool Load(const string &path, State *state, string *err)
Definition: deps_log.cc:143
bool Recompact(const string &path, string *err)
Rewrite the known log entries, throwing away old data.
Definition: deps_log.cc:256
bool needs_recompaction_
Definition: deps_log.h:99
bool RecordId(Node *node)
Definition: deps_log.cc:317
#define METRIC_RECORD(name)
The primary interface to metrics.
Definition: metrics.h:85
const string & path() const
Definition: graph.h:73
void Close()
Definition: deps_log.cc:137
int id() const
Definition: graph.h:83
FILE * file_
Definition: deps_log.h:100
bool Truncate(const string &path, size_t size, string *err)
Truncates a file to the given size.
Definition: util.cc:363
~DepsLog()
Definition: deps_log.cc:35
unsigned short uint16_t
Definition: win32port.h:19
const vector< Deps * > & deps() const
Definition: deps_log.h:90
Global state (file status, loaded rules) for a single run.
Definition: state.h:83
bool RecordDeps(Node *node, TimeStamp mtime, const vector< Node * > &nodes)
Definition: deps_log.cc:71
bool UpdateDeps(int out_id, Deps *deps)
Definition: deps_log.cc:306