fix cmake
[lyx.git] / src / LaTeX.cpp
blob1910b1dc7a7c317f77f9549bad4d5109b86ad10c
1 /**
2 * \file LaTeX.cpp
3 * This file is part of LyX, the document processor.
4 * Licence details can be found in the file COPYING.
6 * \author Alfredo Braunstein
7 * \author Lars Gullik Bjønnes
8 * \author Jean-Marc Lasgouttes
9 * \author Angus Leeming
10 * \author Dekel Tsur
11 * \author Jürgen Spitzmüller
13 * Full author contact details are available in file CREDITS.
16 #include <config.h>
18 #include "BufferList.h"
19 #include "LaTeX.h"
20 #include "LyXRC.h"
21 #include "DepTable.h"
23 #include "support/debug.h"
24 #include "support/convert.h"
25 #include "support/FileName.h"
26 #include "support/filetools.h"
27 #include "support/gettext.h"
28 #include "support/lstrings.h"
29 #include "support/Systemcall.h"
30 #include "support/os.h"
32 #include <boost/regex.hpp>
34 #include <fstream>
36 using boost::regex;
37 using boost::smatch;
39 using namespace std;
40 using namespace lyx::support;
42 namespace lyx {
44 namespace os = support::os;
46 // TODO: in no particular order
47 // - get rid of the call to
48 // BufferList::updateIncludedTeXfiles, this should either
49 // be done before calling LaTeX::funcs or in a completely
50 // different way.
51 // - the makeindex style files should be taken care of with
52 // the dependency mechanism.
53 // - makeindex commandline options should be supported
54 // - somewhere support viewing of bibtex and makeindex log files.
55 // - we should perhaps also scan the bibtex log file
57 namespace {
59 docstring runMessage(unsigned int count)
61 return bformat(_("Waiting for LaTeX run number %1$d"), count);
64 } // anon namespace
67 * CLASS TEXERRORS
70 void TeXErrors::insertError(int line, docstring const & error_desc,
71 docstring const & error_text)
73 Error newerr(line, error_desc, error_text);
74 errors.push_back(newerr);
78 bool operator==(Aux_Info const & a, Aux_Info const & o)
80 return a.aux_file == o.aux_file &&
81 a.citations == o.citations &&
82 a.databases == o.databases &&
83 a.styles == o.styles;
87 bool operator!=(Aux_Info const & a, Aux_Info const & o)
89 return !(a == o);
94 * CLASS LaTeX
97 LaTeX::LaTeX(string const & latex, OutputParams const & rp,
98 FileName const & f)
99 : cmd(latex), file(f), runparams(rp)
101 num_errors = 0;
102 if (prefixIs(cmd, "pdf")) { // Do we use pdflatex ?
103 depfile = FileName(file.absFilename() + ".dep-pdf");
104 output_file =
105 FileName(changeExtension(file.absFilename(), ".pdf"));
106 } else {
107 depfile = FileName(file.absFilename() + ".dep");
108 output_file =
109 FileName(changeExtension(file.absFilename(), ".dvi"));
114 void LaTeX::deleteFilesOnError() const
116 // currently just a dummy function.
118 // What files do we have to delete?
120 // This will at least make latex do all the runs
121 depfile.removeFile();
123 // but the reason for the error might be in a generated file...
125 // bibtex file
126 FileName const bbl(changeExtension(file.absFilename(), ".bbl"));
127 bbl.removeFile();
129 // makeindex file
130 FileName const ind(changeExtension(file.absFilename(), ".ind"));
131 ind.removeFile();
133 // nomencl file
134 FileName const nls(changeExtension(file.absFilename(), ".nls"));
135 nls.removeFile();
137 // nomencl file (old version of the package)
138 FileName const gls(changeExtension(file.absFilename(), ".gls"));
139 gls.removeFile();
141 // Also remove the aux file
142 FileName const aux(changeExtension(file.absFilename(), ".aux"));
143 aux.removeFile();
147 int LaTeX::run(TeXErrors & terr)
148 // We know that this function will only be run if the lyx buffer
149 // has been changed. We also know that a newly written .tex file
150 // is always different from the previous one because of the date
151 // in it. However it seems safe to run latex (at least) on time
152 // each time the .tex file changes.
154 int scanres = NO_ERRORS;
155 unsigned int count = 0; // number of times run
156 num_errors = 0; // just to make sure.
157 unsigned int const MAX_RUN = 6;
158 DepTable head; // empty head
159 bool rerun = false; // rerun requested
161 // The class LaTeX does not know the temp path.
162 theBufferList().updateIncludedTeXfiles(FileName::getcwd().absFilename(),
163 runparams);
165 // Never write the depfile if an error was encountered.
167 // 0
168 // first check if the file dependencies exist:
169 // ->If it does exist
170 // check if any of the files mentioned in it have
171 // changed (done using a checksum).
172 // -> if changed:
173 // run latex once and
174 // remake the dependency file
175 // -> if not changed:
176 // just return there is nothing to do for us.
177 // ->if it doesn't exist
178 // make it and
179 // run latex once (we need to run latex once anyway) and
180 // remake the dependency file.
183 bool had_depfile = depfile.exists();
184 bool run_bibtex = false;
185 FileName const aux_file(changeExtension(file.absFilename(), "aux"));
187 if (had_depfile) {
188 LYXERR(Debug::DEPEND, "Dependency file exists");
189 // Read the dep file:
190 had_depfile = head.read(depfile);
193 if (had_depfile) {
194 // Update the checksums
195 head.update();
196 // Can't just check if anything has changed because it might
197 // have aborted on error last time... in which cas we need
198 // to re-run latex and collect the error messages
199 // (even if they are the same).
200 if (!output_file.exists()) {
201 LYXERR(Debug::DEPEND,
202 "re-running LaTeX because output file doesn't exist.");
203 } else if (!head.sumchange()) {
204 LYXERR(Debug::DEPEND, "return no_change");
205 return NO_CHANGE;
206 } else {
207 LYXERR(Debug::DEPEND, "Dependency file has changed");
210 if (head.extchanged(".bib") || head.extchanged(".bst"))
211 run_bibtex = true;
212 } else
213 LYXERR(Debug::DEPEND,
214 "Dependency file does not exist, or has wrong format");
216 /// We scan the aux file even when had_depfile = false,
217 /// because we can run pdflatex on the file after running latex on it,
218 /// in which case we will not need to run bibtex again.
219 vector<Aux_Info> bibtex_info_old;
220 if (!run_bibtex)
221 bibtex_info_old = scanAuxFiles(aux_file);
223 ++count;
224 LYXERR(Debug::LATEX, "Run #" << count);
225 message(runMessage(count));
227 startscript();
228 scanres = scanLogFile(terr);
229 if (scanres & ERROR_RERUN) {
230 LYXERR(Debug::LATEX, "Rerunning LaTeX");
231 startscript();
232 scanres = scanLogFile(terr);
235 if (scanres & ERRORS) {
236 deleteFilesOnError();
237 return scanres; // return on error
240 vector<Aux_Info> const bibtex_info = scanAuxFiles(aux_file);
241 if (!run_bibtex && bibtex_info_old != bibtex_info)
242 run_bibtex = true;
244 // update the dependencies.
245 deplog(head); // reads the latex log
246 head.update();
248 // 0.5
249 // At this point we must run external programs if needed.
250 // makeindex will be run if a .idx file changed or was generated.
251 // And if there were undefined citations or changes in references
252 // the .aux file is checked for signs of bibtex. Bibtex is then run
253 // if needed.
255 // memoir (at least) writes an empty *idx file in the first place.
256 // A second latex run is needed.
257 FileName const idxfile(changeExtension(file.absFilename(), ".idx"));
258 rerun = idxfile.exists() && idxfile.isFileEmpty();
260 // run makeindex
261 if (head.haschanged(idxfile)) {
262 // no checks for now
263 LYXERR(Debug::LATEX, "Running MakeIndex.");
264 message(_("Running MakeIndex."));
265 // onlyFilename() is needed for cygwin
266 rerun |= runMakeIndex(onlyFilename(idxfile.absFilename()),
267 runparams);
269 FileName const nlofile(changeExtension(file.absFilename(), ".nlo"));
270 if (head.haschanged(nlofile))
271 rerun |= runMakeIndexNomencl(file, runparams, ".nlo", ".nls");
272 FileName const glofile(changeExtension(file.absFilename(), ".glo"));
273 if (head.haschanged(glofile))
274 rerun |= runMakeIndexNomencl(file, runparams, ".glo", ".gls");
276 // run bibtex
277 // if (scanres & UNDEF_CIT || scanres & RERUN || run_bibtex)
278 if (scanres & UNDEF_CIT || run_bibtex) {
279 // Here we must scan the .aux file and look for
280 // "\bibdata" and/or "\bibstyle". If one of those
281 // tags is found -> run bibtex and set rerun = true;
282 // no checks for now
283 LYXERR(Debug::LATEX, "Running BibTeX.");
284 message(_("Running BibTeX."));
285 updateBibtexDependencies(head, bibtex_info);
286 rerun |= runBibTeX(bibtex_info);
287 } else if (!had_depfile) {
288 /// If we run pdflatex on the file after running latex on it,
289 /// then we do not need to run bibtex, but we do need to
290 /// insert the .bib and .bst files into the .dep-pdf file.
291 updateBibtexDependencies(head, bibtex_info);
294 // 1
295 // we know on this point that latex has been run once (or we just
296 // returned) and the question now is to decide if we need to run
297 // it any more. This is done by asking if any of the files in the
298 // dependency file has changed. (remember that the checksum for
299 // a given file is reported to have changed if it just was created)
300 // -> if changed or rerun == true:
301 // run latex once more and
302 // update the dependency structure
303 // -> if not changed:
304 // we does nothing at this point
306 if (rerun || head.sumchange()) {
307 rerun = false;
308 ++count;
309 LYXERR(Debug::DEPEND, "Dep. file has changed or rerun requested");
310 LYXERR(Debug::LATEX, "Run #" << count);
311 message(runMessage(count));
312 startscript();
313 scanres = scanLogFile(terr);
314 if (scanres & ERRORS) {
315 deleteFilesOnError();
316 return scanres; // return on error
319 // update the depedencies
320 deplog(head); // reads the latex log
321 head.update();
322 } else {
323 LYXERR(Debug::DEPEND, "Dep. file has NOT changed");
326 // 1.5
327 // The inclusion of files generated by external programs like
328 // makeindex or bibtex might have done changes to pagenumbering,
329 // etc. And because of this we must run the external programs
330 // again to make sure everything is redone correctly.
331 // Also there should be no need to run the external programs any
332 // more after this.
334 // run makeindex if the <file>.idx has changed or was generated.
335 if (head.haschanged(idxfile)) {
336 // no checks for now
337 LYXERR(Debug::LATEX, "Running MakeIndex.");
338 message(_("Running MakeIndex."));
339 // onlyFilename() is needed for cygwin
340 rerun = runMakeIndex(onlyFilename(changeExtension(
341 file.absFilename(), ".idx")), runparams);
344 // I am not pretty sure if need this twice.
345 if (head.haschanged(nlofile))
346 rerun |= runMakeIndexNomencl(file, runparams, ".nlo", ".nls");
347 if (head.haschanged(glofile))
348 rerun |= runMakeIndexNomencl(file, runparams, ".glo", ".gls");
350 // 2
351 // we will only run latex more if the log file asks for it.
352 // or if the sumchange() is true.
353 // -> rerun asked for:
354 // run latex and
355 // remake the dependency file
356 // goto 2 or return if max runs are reached.
357 // -> rerun not asked for:
358 // just return (fall out of bottom of func)
360 while ((head.sumchange() || rerun || (scanres & RERUN))
361 && count < MAX_RUN) {
362 // Yes rerun until message goes away, or until
363 // MAX_RUNS are reached.
364 rerun = false;
365 ++count;
366 LYXERR(Debug::LATEX, "Run #" << count);
367 message(runMessage(count));
368 startscript();
369 scanres = scanLogFile(terr);
370 if (scanres & ERRORS) {
371 deleteFilesOnError();
372 return scanres; // return on error
375 // keep this updated
376 head.update();
379 // Write the dependencies to file.
380 head.write(depfile);
381 LYXERR(Debug::LATEX, "Done.");
382 return scanres;
386 int LaTeX::startscript()
388 // onlyFilename() is needed for cygwin
389 string tmp = cmd + ' '
390 + quoteName(onlyFilename(file.toFilesystemEncoding()))
391 + " > " + os::nulldev();
392 Systemcall one;
393 return one.startscript(Systemcall::Wait, tmp);
397 bool LaTeX::runMakeIndex(string const & f, OutputParams const & runparams,
398 string const & params)
400 LYXERR(Debug::LATEX,
401 "idx file has been made, running makeindex on file " << f);
402 string tmp = lyxrc.index_command + ' ';
404 tmp = subst(tmp, "$$lang", runparams.document_language);
405 tmp += quoteName(f);
406 tmp += params;
407 Systemcall one;
408 one.startscript(Systemcall::Wait, tmp);
409 return true;
413 bool LaTeX::runMakeIndexNomencl(FileName const & file,
414 OutputParams const & runparams,
415 string const & nlo, string const & nls)
417 LYXERR(Debug::LATEX, "Running MakeIndex for nomencl.");
418 message(_("Running MakeIndex for nomencl."));
419 // onlyFilename() is needed for cygwin
420 string const nomenclstr = " -s nomencl.ist -o "
421 + onlyFilename(changeExtension(file.toFilesystemEncoding(), nls));
422 return runMakeIndex(
423 onlyFilename(changeExtension(file.absFilename(), nlo)),
424 runparams, nomenclstr);
428 vector<Aux_Info> const
429 LaTeX::scanAuxFiles(FileName const & file)
431 vector<Aux_Info> result;
433 result.push_back(scanAuxFile(file));
435 string const basename = removeExtension(file.absFilename());
436 for (int i = 1; i < 1000; ++i) {
437 FileName const file2(basename
438 + '.' + convert<string>(i)
439 + ".aux");
440 if (!file2.exists())
441 break;
442 result.push_back(scanAuxFile(file2));
444 return result;
448 Aux_Info const LaTeX::scanAuxFile(FileName const & file)
450 Aux_Info result;
451 result.aux_file = file;
452 scanAuxFile(file, result);
453 return result;
457 void LaTeX::scanAuxFile(FileName const & file, Aux_Info & aux_info)
459 LYXERR(Debug::LATEX, "Scanning aux file: " << file);
461 ifstream ifs(file.toFilesystemEncoding().c_str());
462 string token;
463 static regex const reg1("\\\\citation\\{([^}]+)\\}");
464 static regex const reg2("\\\\bibdata\\{([^}]+)\\}");
465 static regex const reg3("\\\\bibstyle\\{([^}]+)\\}");
466 static regex const reg4("\\\\@input\\{([^}]+)\\}");
468 while (getline(ifs, token)) {
469 token = rtrim(token, "\r");
470 smatch sub;
471 // FIXME UNICODE: We assume that citation keys and filenames
472 // in the aux file are in the file system encoding.
473 token = to_utf8(from_filesystem8bit(token));
474 if (regex_match(token, sub, reg1)) {
475 string data = sub.str(1);
476 while (!data.empty()) {
477 string citation;
478 data = split(data, citation, ',');
479 LYXERR(Debug::LATEX, "Citation: " << citation);
480 aux_info.citations.insert(citation);
482 } else if (regex_match(token, sub, reg2)) {
483 string data = sub.str(1);
484 // data is now all the bib files separated by ','
485 // get them one by one and pass them to the helper
486 while (!data.empty()) {
487 string database;
488 data = split(data, database, ',');
489 database = changeExtension(database, "bib");
490 LYXERR(Debug::LATEX, "BibTeX database: `" << database << '\'');
491 aux_info.databases.insert(database);
493 } else if (regex_match(token, sub, reg3)) {
494 string style = sub.str(1);
495 // token is now the style file
496 // pass it to the helper
497 style = changeExtension(style, "bst");
498 LYXERR(Debug::LATEX, "BibTeX style: `" << style << '\'');
499 aux_info.styles.insert(style);
500 } else if (regex_match(token, sub, reg4)) {
501 string const file2 = sub.str(1);
502 scanAuxFile(makeAbsPath(file2), aux_info);
508 void LaTeX::updateBibtexDependencies(DepTable & dep,
509 vector<Aux_Info> const & bibtex_info)
511 // Since a run of Bibtex mandates more latex runs it is ok to
512 // remove all ".bib" and ".bst" files.
513 dep.remove_files_with_extension(".bib");
514 dep.remove_files_with_extension(".bst");
515 //string aux = OnlyFilename(ChangeExtension(file, ".aux"));
517 for (vector<Aux_Info>::const_iterator it = bibtex_info.begin();
518 it != bibtex_info.end(); ++it) {
519 for (set<string>::const_iterator it2 = it->databases.begin();
520 it2 != it->databases.end(); ++it2) {
521 FileName const file = findtexfile(*it2, "bib");
522 if (!file.empty())
523 dep.insert(file, true);
526 for (set<string>::const_iterator it2 = it->styles.begin();
527 it2 != it->styles.end(); ++it2) {
528 FileName const file = findtexfile(*it2, "bst");
529 if (!file.empty())
530 dep.insert(file, true);
536 bool LaTeX::runBibTeX(vector<Aux_Info> const & bibtex_info)
538 bool result = false;
539 for (vector<Aux_Info>::const_iterator it = bibtex_info.begin();
540 it != bibtex_info.end(); ++it) {
541 if (it->databases.empty())
542 continue;
543 result = true;
545 string tmp = lyxrc.bibtex_command + " ";
546 // onlyFilename() is needed for cygwin
547 tmp += quoteName(onlyFilename(removeExtension(
548 it->aux_file.absFilename())));
549 Systemcall one;
550 one.startscript(Systemcall::Wait, tmp);
552 // Return whether bibtex was run
553 return result;
557 int LaTeX::scanLogFile(TeXErrors & terr)
559 int last_line = -1;
560 int line_count = 1;
561 int retval = NO_ERRORS;
562 string tmp =
563 onlyFilename(changeExtension(file.absFilename(), ".log"));
564 LYXERR(Debug::LATEX, "Log file: " << tmp);
565 FileName const fn = FileName(makeAbsPath(tmp));
566 ifstream ifs(fn.toFilesystemEncoding().c_str());
567 bool fle_style = false;
568 static regex file_line_error(".+\\.\\D+:[0-9]+: (.+)");
570 string token;
571 while (getline(ifs, token)) {
572 // MikTeX sometimes inserts \0 in the log file. They can't be
573 // removed directly with the existing string utility
574 // functions, so convert them first to \r, and remove all
575 // \r's afterwards, since we need to remove them anyway.
576 token = subst(token, '\0', '\r');
577 token = subst(token, "\r", "");
578 smatch sub;
580 LYXERR(Debug::LATEX, "Log line: " << token);
582 if (token.empty())
583 continue;
585 if (contains(token, "file:line:error style messages enabled"))
586 fle_style = true;
588 if (prefixIs(token, "LaTeX Warning:") ||
589 prefixIs(token, "! pdfTeX warning")) {
590 // Here shall we handle different
591 // types of warnings
592 retval |= LATEX_WARNING;
593 LYXERR(Debug::LATEX, "LaTeX Warning.");
594 if (contains(token, "Rerun to get cross-references")) {
595 retval |= RERUN;
596 LYXERR(Debug::LATEX, "We should rerun.");
597 // package clefval needs 2 latex runs before bibtex
598 } else if (contains(token, "Value of")
599 && contains(token, "on page")
600 && contains(token, "undefined")) {
601 retval |= ERROR_RERUN;
602 LYXERR(Debug::LATEX, "Force rerun.");
603 } else if (contains(token, "Citation")
604 && contains(token, "on page")
605 && contains(token, "undefined")) {
606 retval |= UNDEF_CIT;
608 } else if (prefixIs(token, "Package")) {
609 // Package warnings
610 retval |= PACKAGE_WARNING;
611 if (contains(token, "natbib Warning:")) {
612 // Natbib warnings
613 if (contains(token, "Citation")
614 && contains(token, "on page")
615 && contains(token, "undefined")) {
616 retval |= UNDEF_CIT;
618 } else if (contains(token, "run BibTeX")) {
619 retval |= UNDEF_CIT;
620 } else if (contains(token, "Rerun LaTeX") ||
621 contains(token, "Rerun to get")) {
622 // at least longtable.sty and bibtopic.sty
623 // might use this.
624 LYXERR(Debug::LATEX, "We should rerun.");
625 retval |= RERUN;
627 } else if (token[0] == '(') {
628 if (contains(token, "Rerun LaTeX") ||
629 contains(token, "Rerun to get")) {
630 // Used by natbib
631 LYXERR(Debug::LATEX, "We should rerun.");
632 retval |= RERUN;
634 } else if (prefixIs(token, "! ") ||
635 fle_style && regex_match(token, sub, file_line_error)) {
636 // Ok, we have something that looks like a TeX Error
637 // but what do we really have.
639 // Just get the error description:
640 string desc;
641 if (prefixIs(token, "! "))
642 desc = string(token, 2);
643 else if (fle_style)
644 desc = sub.str();
645 if (contains(token, "LaTeX Error:"))
646 retval |= LATEX_ERROR;
647 // get the next line
648 string tmp;
649 int count = 0;
650 do {
651 if (!getline(ifs, tmp))
652 break;
653 if (++count > 10)
654 break;
655 } while (!prefixIs(tmp, "l."));
656 if (prefixIs(tmp, "l.")) {
657 // we have a latex error
658 retval |= TEX_ERROR;
659 if (contains(desc,
660 "Package babel Error: You haven't defined the language") ||
661 contains(desc,
662 "Package babel Error: You haven't loaded the option"))
663 retval |= ERROR_RERUN;
664 // get the line number:
665 int line = 0;
666 sscanf(tmp.c_str(), "l.%d", &line);
667 // get the rest of the message:
668 string errstr(tmp, tmp.find(' '));
669 errstr += '\n';
670 getline(ifs, tmp);
671 while (!contains(errstr, "l.")
672 && !tmp.empty()
673 && !prefixIs(tmp, "! ")
674 && !contains(tmp, "(job aborted")) {
675 errstr += tmp;
676 errstr += "\n";
677 getline(ifs, tmp);
679 LYXERR(Debug::LATEX, "line: " << line << '\n'
680 << "Desc: " << desc << '\n' << "Text: " << errstr);
681 if (line == last_line)
682 ++line_count;
683 else {
684 line_count = 1;
685 last_line = line;
687 if (line_count <= 5) {
688 // FIXME UNICODE
689 // We have no idea what the encoding of
690 // the log file is.
691 // It seems that the output from the
692 // latex compiler itself is pure ASCII,
693 // but it can include bits from the
694 // document, so whatever encoding we
695 // assume here it can be wrong.
696 terr.insertError(line,
697 from_local8bit(desc),
698 from_local8bit(errstr));
699 ++num_errors;
702 } else {
703 // information messages, TeX warnings and other
704 // warnings we have not caught earlier.
705 if (prefixIs(token, "Overfull ")) {
706 retval |= TEX_WARNING;
707 } else if (prefixIs(token, "Underfull ")) {
708 retval |= TEX_WARNING;
709 } else if (contains(token, "Rerun to get citations")) {
710 // Natbib seems to use this.
711 retval |= UNDEF_CIT;
712 } else if (contains(token, "No pages of output")) {
713 // A dvi file was not created
714 retval |= NO_OUTPUT;
715 } else if (contains(token, "That makes 100 errors")) {
716 // More than 100 errors were reprted
717 retval |= TOO_MANY_ERRORS;
721 LYXERR(Debug::LATEX, "Log line: " << token);
722 return retval;
726 namespace {
728 bool insertIfExists(FileName const & absname, DepTable & head)
730 if (absname.exists() && !absname.isDirectory()) {
731 head.insert(absname, true);
732 return true;
734 return false;
738 bool handleFoundFile(string const & ff, DepTable & head)
740 // convert from native os path to unix path
741 string foundfile = os::internal_path(trim(ff));
743 LYXERR(Debug::DEPEND, "Found file: " << foundfile);
745 // Ok now we found a file.
746 // Now we should make sure that this is a file that we can
747 // access through the normal paths.
748 // We will not try any fancy search methods to
749 // find the file.
751 // (1) foundfile is an
752 // absolute path and should
753 // be inserted.
754 FileName absname(foundfile);
755 if (absname.isAbsolute()) {
756 LYXERR(Debug::DEPEND, "AbsolutePath file: " << foundfile);
757 // On initial insert we want to do the update at once
758 // since this file cannot be a file generated by
759 // the latex run.
760 if (!insertIfExists(absname, head)) {
761 // check for spaces
762 string strippedfile = foundfile;
763 while (contains(strippedfile, " ")) {
764 // files with spaces are often enclosed in quotation
765 // marks; those have to be removed
766 string unquoted = subst(strippedfile, "\"", "");
767 absname.set(unquoted);
768 if (insertIfExists(absname, head))
769 return true;
770 // strip off part after last space and try again
771 string tmp = strippedfile;
772 string const stripoff =
773 rsplit(tmp, strippedfile, ' ');
774 absname.set(strippedfile);
775 if (insertIfExists(absname, head))
776 return true;
781 string onlyfile = onlyFilename(foundfile);
782 absname = makeAbsPath(onlyfile);
784 // check for spaces
785 while (contains(foundfile, ' ')) {
786 if (absname.exists())
787 // everything o.k.
788 break;
789 else {
790 // files with spaces are often enclosed in quotation
791 // marks; those have to be removed
792 string unquoted = subst(foundfile, "\"", "");
793 absname = makeAbsPath(unquoted);
794 if (absname.exists())
795 break;
796 // strip off part after last space and try again
797 string strippedfile;
798 string const stripoff =
799 rsplit(foundfile, strippedfile, ' ');
800 foundfile = strippedfile;
801 onlyfile = onlyFilename(strippedfile);
802 absname = makeAbsPath(onlyfile);
806 // (2) foundfile is in the tmpdir
807 // insert it into head
808 if (absname.exists() && !absname.isDirectory()) {
809 // FIXME: This regex contained glo, but glo is used by the old
810 // version of nomencl.sty. Do we need to put it back?
811 static regex const unwanted("^.*\\.(aux|log|dvi|bbl|ind)$");
812 if (regex_match(onlyfile, unwanted)) {
813 LYXERR(Debug::DEPEND, "We don't want " << onlyfile
814 << " in the dep file");
815 } else if (suffixIs(onlyfile, ".tex")) {
816 // This is a tex file generated by LyX
817 // and latex is not likely to change this
818 // during its runs.
819 LYXERR(Debug::DEPEND, "Tmpdir TeX file: " << onlyfile);
820 head.insert(absname, true);
821 } else {
822 LYXERR(Debug::DEPEND, "In tmpdir file:" << onlyfile);
823 head.insert(absname);
825 return true;
826 } else {
827 LYXERR(Debug::DEPEND, "Not a file or we are unable to find it.");
828 return false;
833 bool checkLineBreak(string const & ff, DepTable & head)
835 if (!contains(ff, '.'))
836 return false;
838 // if we have a dot, we let handleFoundFile decide
839 return handleFoundFile(ff, head);
842 } // anon namespace
845 void LaTeX::deplog(DepTable & head)
847 // This function reads the LaTeX log file end extracts all the
848 // external files used by the LaTeX run. The files are then
849 // entered into the dependency file.
851 string const logfile =
852 onlyFilename(changeExtension(file.absFilename(), ".log"));
854 static regex const reg1("File: (.+).*");
855 static regex const reg2("No file (.+)(.).*");
856 static regex const reg3("\\\\openout[0-9]+.*=.*`(.+)(..).*");
857 // If an index should be created, MikTex does not write a line like
858 // \openout# = 'sample.idx'.
859 // but instead only a line like this into the log:
860 // Writing index file sample.idx
861 static regex const reg4("Writing index file (.+).*");
862 // files also can be enclosed in <...>
863 static regex const reg5("<([^>]+)(.).*");
864 static regex const regoldnomencl("Writing glossary file (.+).*");
865 static regex const regnomencl("Writing nomenclature file (.+).*");
866 // If a toc should be created, MikTex does not write a line like
867 // \openout# = `sample.toc'.
868 // but only a line like this into the log:
869 // \tf@toc=\write#
870 // This line is also written by tetex.
871 // This line is not present if no toc should be created.
872 static regex const miktexTocReg("\\\\tf@toc=\\\\write.*");
873 static regex const reg6(".*\\([^)]+.*");
875 FileName const fn = makeAbsPath(logfile);
876 ifstream ifs(fn.toFilesystemEncoding().c_str());
877 string lastline;
878 while (ifs) {
879 // Ok, the scanning of files here is not sufficient.
880 // Sometimes files are named by "File: xxx" only
881 // So I think we should use some regexps to find files instead.
882 // Note: all file names and paths might contains spaces.
883 bool found_file = false;
884 string token;
885 getline(ifs, token);
886 // MikTeX sometimes inserts \0 in the log file. They can't be
887 // removed directly with the existing string utility
888 // functions, so convert them first to \r, and remove all
889 // \r's afterwards, since we need to remove them anyway.
890 token = subst(token, '\0', '\r');
891 token = subst(token, "\r", "");
892 if (token.empty() || token == ")") {
893 lastline = string();
894 continue;
897 // Sometimes, filenames are broken across lines.
898 // We care for that and save suspicious lines.
899 // Here we exclude some cases where we are sure
900 // that there is no continued filename
901 if (!lastline.empty()) {
902 static regex const package_info("Package \\w+ Info: .*");
903 static regex const package_warning("Package \\w+ Warning: .*");
904 if (prefixIs(token, "File:") || prefixIs(token, "(Font)")
905 || prefixIs(token, "Package:")
906 || prefixIs(token, "Language:")
907 || prefixIs(token, "LaTeX Info:")
908 || prefixIs(token, "LaTeX Font Info:")
909 || prefixIs(token, "\\openout[")
910 || prefixIs(token, "))")
911 || regex_match(token, package_info)
912 || regex_match(token, package_warning))
913 lastline = string();
916 if (!lastline.empty())
917 // probably a continued filename from last line
918 token = lastline + token;
919 if (token.length() > 255) {
920 // string too long. Cut off.
921 token.erase(0, token.length() - 251);
924 smatch sub;
926 // FIXME UNICODE: We assume that the file names in the log
927 // file are in the file system encoding.
928 token = to_utf8(from_filesystem8bit(token));
930 // (1) "File: file.ext"
931 if (regex_match(token, sub, reg1)) {
932 // check for dot
933 found_file = checkLineBreak(sub.str(1), head);
934 // However, ...
935 if (suffixIs(token, ")"))
936 // no line break for sure
937 // pretend we've been succesfully searching
938 found_file = true;
939 // (2) "No file file.ext"
940 } else if (regex_match(token, sub, reg2)) {
941 // file names must contains a dot, line ends with dot
942 if (contains(sub.str(1), '.') && sub.str(2) == ".")
943 found_file = handleFoundFile(sub.str(1), head);
944 else
945 // we suspect a line break
946 found_file = false;
947 // (3) "\openout<nr> = `file.ext'."
948 } else if (regex_match(token, sub, reg3)) {
949 // search for closing '. at the end of the line
950 if (sub.str(2) == "\'.")
951 found_file = handleFoundFile(sub.str(1), head);
952 else
953 // probable line break
954 found_file = false;
955 // (4) "Writing index file file.ext"
956 } else if (regex_match(token, sub, reg4))
957 // check for dot
958 found_file = checkLineBreak(sub.str(1), head);
959 // (5) "<file.ext>"
960 else if (regex_match(token, sub, reg5)) {
961 // search for closing '>' and dot ('*.*>') at the eol
962 if (contains(sub.str(1), '.') && sub.str(2) == ">")
963 found_file = handleFoundFile(sub.str(1), head);
964 else
965 // probable line break
966 found_file = false;
967 // (6) "Writing nomenclature file file.ext"
968 } else if (regex_match(token, sub, regnomencl) ||
969 regex_match(token, sub, regoldnomencl))
970 // check for dot
971 found_file = checkLineBreak(sub.str(1), head);
972 // (7) "\tf@toc=\write<nr>" (for MikTeX)
973 else if (regex_match(token, sub, miktexTocReg))
974 found_file = handleFoundFile(onlyFilename(changeExtension(
975 file.absFilename(), ".toc")), head);
976 else
977 // not found, but we won't check further
978 // pretend we've been succesfully searching
979 found_file = true;
981 // (8) "(file.ext"
982 // note that we can have several of these on one line
983 // this must be queried separated, because of
984 // cases such as "File: file.ext (type eps)"
985 // where "File: file.ext" would be skipped
986 if (regex_match(token, sub, reg6)) {
987 // search for strings in (...)
988 static regex reg6_1("\\(([^()]+)(.).*");
989 smatch what;
990 string::const_iterator first = token.begin();
991 string::const_iterator end = token.end();
993 while (regex_search(first, end, what, reg6_1)) {
994 // if we have a dot, try to handle as file
995 if (contains(what.str(1), '.')) {
996 first = what[0].second;
997 if (what.str(2) == ")") {
998 handleFoundFile(what.str(1), head);
999 // since we had a closing bracket,
1000 // do not investigate further
1001 found_file = true;
1002 } else
1003 // if we have no closing bracket,
1004 // try to handle as file nevertheless
1005 found_file = handleFoundFile(
1006 what.str(1) + what.str(2), head);
1008 // if we do not have a dot, check if the line has
1009 // a closing bracket (else, we suspect a line break)
1010 else if (what.str(2) != ")") {
1011 first = what[0].second;
1012 found_file = false;
1013 } else {
1014 // we have a closing bracket, so the content
1015 // is not a file name.
1016 // no need to investigate further
1017 // pretend we've been succesfully searching
1018 first = what[0].second;
1019 found_file = true;
1024 if (!found_file)
1025 // probable linebreak:
1026 // save this line
1027 lastline = token;
1028 else
1029 // no linebreak: reset
1030 lastline = string();
1033 // Make sure that the main .tex file is in the dependency file.
1034 head.insert(file, true);
1038 } // namespace lyx