Doxygen
Loading...
Searching...
No Matches
cite.cpp
Go to the documentation of this file.
1/******************************************************************************
2 *
3 * Copyright (C) 2020 by Dimitri van Heesch
4 * Based on a patch by David Munger
5 *
6 * Permission to use, copy, modify, and distribute this software and its
7 * documentation under the terms of the GNU General Public License is hereby
8 * granted. No representations are made about the suitability of this software
9 * for any purpose. It is provided "as is" without express or implied warranty.
10 * See the GNU General Public License for more details.
11 *
12 * Documents produced by Doxygen are derivative works derived from the
13 * input used in their production; they are not affected by this license.
14 *
15 */
16
17#include "cite.h"
18#include "config.h"
19#include "language.h"
20#include "message.h"
21#include "portable.h"
22#include "resourcemgr.h"
23#include "util.h"
24#include "debug.h"
25#include "fileinfo.h"
26#include "dir.h"
27#include "entry.h"
28#include "commentscan.h"
29#include "linkedmap.h"
30
31#include <map>
32#include <unordered_map>
33#include <string>
34#include <fstream>
35
36const char *bibTmpFile = "bibTmpFile_";
37const char *bibTmpDir = "bibTmpDir/";
38
39//! class that provides information about the position of a citation name
41{
42 public:
43 CitePosition(const QCString &fn, int l) : fileName(fn), lineNr(l) {}
44
46 int lineNr;
47};
48
49static QCString getBibFile(const QCString &inFile)
50{
51 QCString name = inFile;
52 if (!name.isEmpty() && !name.endsWith(".bib")) name+=".bib";
53 return name;
54}
55
56class CiteInfoImpl : public CiteInfo
57{
58 public:
61
62 QCString label() const override { return m_label; }
63 QCString text() const override { return m_text; }
64 QCString shortAuthor() const override { return m_shortAuthor; }
65 QCString year() const override { return m_year; }
66
67 void setText(const QCString &s) { m_text = s; }
68 void setShortAuthor(const QCString &s) { m_shortAuthor = s; }
69 void setYear(const QCString &s) { m_year = s; }
70
71 private:
76};
77
79{
80 std::map< std::string,std::unique_ptr<CiteInfoImpl> > entries;
81 std::unordered_map< int,std::string > formulaCite;
82 std::unordered_map< std::string, CitePosition > citePosition;
83};
84
86{
87 static CitationManager ct;
88 return ct;
89}
90
94
96{
97 QCString lowerCaseLabel = label.lower();
98 p->entries.emplace(lowerCaseLabel.str(),std::make_unique<CiteInfoImpl>(lowerCaseLabel));
99}
100
101const CiteInfo *CitationManager::find(const QCString &label) const
102{
103 if (auto it = p->entries.find(label.lower().str()); it != p->entries.end())
104 {
105 return it->second.get();
106 }
107 return nullptr;
108}
109
111{
112 p->entries.clear();
113}
114
116{
117 size_t numFiles = Config_getList(CITE_BIB_FILES).size();
118 return (numFiles==0 || p->entries.empty());
119}
120
122{
123 return "citelist";
124}
125
127{
128 return "CITEREF_";
129}
130
132{
133 // sanity checks
134 if (bibFile.isEmpty())
135 {
136 return;
137 }
138 FileInfo fi(bibFile.str());
139 if (!fi.exists())
140 {
141 err("bib file {} not found!\n",bibFile);
142 return;
143 }
144 std::ifstream f = Portable::openInputStream(bibFile);
145 if (!f.is_open())
146 {
147 err("could not open file {} for reading\n",bibFile);
148 return;
149 }
150
151 // search for citation cross references
152 QCString citeName;
153
154 std::string lineStr;
155 int lineCount = 0;
156 while (getline(f,lineStr))
157 {
158 int i = -1;
159 QCString line(lineStr);
160 lineCount++;
161 if (line.stripWhiteSpace().startsWith("@"))
162 {
163 // assumption entry like: "@book { name," or "@book { name" (spaces optional)
164 int j = line.find('{');
165 // when no {, go hunting for it
166 while (j==-1 && getline(f,lineStr))
167 {
168 line = lineStr;
169 lineCount++;
170 j = line.find('{');
171 }
172 // search for the name
173 citeName = "";
174 if (!f.eof() && j!=-1) // to prevent something like "@manual ," and no { found
175 {
176 int k = line.find(',',j);
177 j++;
178 // found a line "@....{.....,...." or "@.....{....."
179 // ^=j ^=k ^=j k=-1
180 while (!f.eof() && citeName.isEmpty())
181 {
182 if (k!=-1)
183 {
184 citeName = line.mid(static_cast<size_t>(j),static_cast<size_t>(k-j));
185 }
186 else
187 {
188 citeName = line.mid(static_cast<size_t>(j));
189 }
190 citeName = citeName.stripWhiteSpace();
191 j = 0;
192 if (citeName.isEmpty() && getline(f,lineStr))
193 {
194 line = lineStr;
195 lineCount++;
196 k = line.find(',');
197 }
198 }
199 }
200 //printf("citeName = #%s#\n",qPrint(citeName));
201 if (!citeName.isEmpty())
202 {
203 std::string lCiteName = citeName.lower().str();
204 auto it = p->citePosition.find(lCiteName);
205 if (it != p->citePosition.end())
206 {
207 warn(bibFile,lineCount,"multiple use of citation name '{}', (first occurrence: {}, line {})",
208 lCiteName,it->second.fileName,it->second.lineNr);
209 }
210 else
211 {
212 p->citePosition.emplace(lCiteName,CitePosition(bibFile,lineCount));
213 }
214 }
215 }
216 else if ((i=line.find("crossref"))!=-1 && !citeName.isEmpty()) /* assumption cross reference is on one line and the only item */
217 {
218 int j = line.find('{',i);
219 int k = line.find('}',i);
220 if (j>i && k>j)
221 {
222 QCString crossrefName = line.mid(static_cast<size_t>(j+1),static_cast<uint32_t>(k-j-1));
223 // check if the reference with the cross reference is used
224 // insert cross reference when cross reference has not yet been added.
225 if (find(citeName) && !find(crossrefName)) // not found yet
226 {
227 insert(crossrefName);
228 }
229 }
230 }
231 }
232}
233
234static const std::string g_formulaMarker = "CITE_FORMULA_";
235
237{
238 if (s.isEmpty()) return s;
239 QCString result;
240 result.reserve(s.length()+32);
241 QCString formula;
242 formula.reserve(256);
243 bool insideFormula = false;
244 int citeFormulaCnt = 1;
245 const char *ps=s.data();
246 char c = 0;
247 while ((c=*ps++))
248 {
249 if (insideFormula)
250 {
251 switch (c)
252 {
253 case '\\':
254 formula+=c;
255 c = *ps++;
256 formula+=c;
257 break;
258 case '\n':
259 formula+=c;
260 result+='$';
261 result+=formula;
262 insideFormula = false;
263 formula.clear();
264 break;
265 case '$':
266 {
267 const size_t idLen = 30;
268 char id[idLen];
269 qsnprintf(id,idLen,"%s%06d",g_formulaMarker.c_str(),citeFormulaCnt);
270 p->formulaCite.emplace(citeFormulaCnt,std::string("\\f$") + formula.str() + "\\f$");
271 citeFormulaCnt++;
272 // need { and } due to the capitalization rules of bibtex.
273 result+='{';
274 result+=id;
275 result+='}';
276 insideFormula = false;
277 formula.clear();
278 }
279 break;
280 default:
281 formula+=c;
282 break;
283 }
284 }
285 else
286 {
287 switch (c)
288 {
289 case '\\':
290 result+=c;
291 c = *ps++;
292 result+=c;
293 break;
294 case '$':
295 insideFormula = true;
296 break;
297 default:
298 result+=c;
299 break;
300 }
301 }
302 }
303 if (insideFormula)
304 {
305 result+=formula;
306 formula.clear();
307 }
308 return result;
309}
310
312{
313 if (s.isEmpty()) return s;
314 QCString t;
315 int pos=0;
316 int i = -1;
317 while ((i=s.find(g_formulaMarker,pos))!=-1)
318 {
319 t += s.mid(pos,i-pos);
320 int markerSize = static_cast<int>( g_formulaMarker.length());
321 int markerId = atoi(s.mid(i+markerSize,6).data());
322 auto it = p->formulaCite.find(markerId);
323 if (it != p->formulaCite.end()) t += it->second;
324 pos = i + markerSize+6;
325 }
326 t += s.mid(pos);
327 //printf("replaceFormulas(%s)=%s\n",qPrint(s),qPrint(t));
328 return t;
329}
330
332{
333 //printf("** CitationManager::generatePage() count=%d\n",m_ordering.count());
334
335 // do not generate an empty citations page
336 if (isEmpty()) return; // nothing to cite
337
338 bool citeDebug = Debug::isFlagSet(Debug::Cite);
339
340 // 0. add cross references from the bib files to the cite dictionary
341 const StringVector &citeDataList = Config_getList(CITE_BIB_FILES);
342 for (const auto &bibdata : citeDataList)
343 {
344 QCString bibFile = getBibFile(bibdata);
346 }
347
348 // 1. generate file with markers and citations to OUTPUT_DIRECTORY
349 QCString outputDir = Config_getString(OUTPUT_DIRECTORY);
350 QCString citeListFile = outputDir+"/citelist.doc";
351 {
352 std::ofstream t = Portable::openOutputStream(citeListFile);
353 if (!t.is_open())
354 {
355 err("could not open file {} for writing\n",citeListFile);
356 }
357 t << "<!-- BEGIN CITATIONS -->\n";
358 t << "<!--\n";
359 for (const auto &it : p->entries)
360 {
361 t << "\\citation{" << it.second->label() << "}\n";
362 }
363 t << "-->\n";
364 t << "<!-- END CITATIONS -->\n";
365 t << "<!-- BEGIN BIBLIOGRAPHY -->\n";
366 t << "<!-- END BIBLIOGRAPHY -->\n";
367 t.close();
368 }
369
370 // 2. generate bib2xhtml
371 QCString bib2xhtmlFile = outputDir+"/bib2xhtml.pl";
372 ResourceMgr::instance().copyResource("bib2xhtml.pl",outputDir);
373
374 // 3. generate doxygen.bst
375 QCString doxygenBstFile = outputDir+"/doxygen.bst";
376 ResourceMgr::instance().copyResource("doxygen.bst",outputDir);
377
378 // 4. for all formats we just copy the bib files to a special output directory
379 // so bibtex can find them without path (bibtex doesn't support paths or
380 // filenames with spaces!)
381 // Strictly not required when only latex is generated
382 QCString bibOutputDir = outputDir+"/"+bibTmpDir;
383 QCString bibOutputFiles = "";
384 Dir thisDir;
385 if (!thisDir.exists(bibOutputDir.str()) && !thisDir.mkdir(bibOutputDir.str()))
386 {
387 err("Failed to create temporary output directory '{}', skipping citations\n",bibOutputDir);
388 return;
389 }
390 int i = 0;
391 for (const auto &bibdata : citeDataList)
392 {
393 QCString bibFile = getBibFile(bibdata);
394 FileInfo fi(bibFile.str());
395 if (fi.exists())
396 {
397 if (!bibFile.isEmpty())
398 {
399 ++i;
400 std::ifstream f_org = Portable::openInputStream(bibFile);
401 if (!f_org.is_open())
402 {
403 err("could not open file {} for reading\n",bibFile);
404 }
405 std::ofstream f_out = Portable::openOutputStream(bibOutputDir + bibTmpFile + QCString().setNum(i) + ".bib");
406 if (!f_out.is_open())
407 {
408 err("could not open file {}{}{:d}{} for reading\n",bibOutputDir,bibTmpFile,i,".bib");
409 }
410 QCString docs;
411 std::string lineStr;
412 while (getline(f_org,lineStr))
413 {
414 docs += lineStr + "\n";
415 }
416 docs = getFormulas(docs);
417 f_out << docs;
418 if (f_org.is_open()) f_org.close();
419 if (f_out.is_open()) f_out.close();
420 bibOutputFiles = bibOutputFiles + " " + bibTmpDir + bibTmpFile + QCString().setNum(i) + ".bib";
421 }
422 }
423 }
424
425 std::string oldDir = Dir::currentDirPath();
426 Dir::setCurrent(outputDir.str());
427
428 // 5. run bib2xhtml perl script on the generated file which will insert the
429 // bibliography in citelist.doc
430 QCString perlArgs = "\""+bib2xhtmlFile+"\" "+bibOutputFiles+" \""+ citeListFile+"\"";
431 if (citeDebug) perlArgs+=" -d";
432 int exitCode = Portable::system("perl",perlArgs);
433 if (exitCode!=0)
434 {
435 err("Problems running bibtex. Verify that the command 'perl --version' works from the command line. Exit code: {}\n",
436 exitCode);
437 }
438
439 Dir::setCurrent(oldDir);
440
441 // 6. read back the file
442 QCString doc;
443 {
444 std::ifstream f = Portable::openInputStream(citeListFile);
445 if (!f.is_open())
446 {
447 err("could not open file {} for reading\n",citeListFile);
448 }
449
450 bool insideBib=FALSE;
451 //printf("input=[%s]\n",qPrint(input));
452 std::string lineStr;
453 while (getline(f,lineStr))
454 {
455 QCString line(lineStr);
456 //printf("pos=%d s=%d line=[%s]\n",pos,s,qPrint(line));
457
458 if (line.find("<!-- BEGIN BIBLIOGRAPHY")!=-1) insideBib=TRUE;
459 else if (line.find("<!-- END BIBLIOGRAPH")!=-1) insideBib=FALSE;
460 // determine text to use at the location of the @cite command
461 if (insideBib && ((i=line.find("name=\"CITEREF_"))!=-1 || (i=line.find("name=\"#CITEREF_"))!=-1))
462 {
463 int j=line.find("\">[");
464 int j1=line.find("<!--[");
465 int k=line.find("]<!--");
466 int k1=line.find("]-->");
467 if (j!=-1 && k!=-1)
468 {
469 size_t ui=static_cast<size_t>(i);
470 size_t uj0=static_cast<size_t>(j);
471 size_t uj=static_cast<size_t>(j1);
472 size_t uk=static_cast<size_t>(k1);
473 QCString label = line.mid(ui+14,uj0-ui-14);
474 StringVector optList = split(line.mid(uj+5,uk-uj-5).str(),",");
475 QCString number = optList[0];
476 QCString shortAuthor = optList[1];
477 QCString year;
478 if (optList.size() == 3)
479 {
480 year = optList[2];
481 }
482 line = line.left(ui+14) + label + line.right(line.length()-uj0);
483 auto it = p->entries.find(label.lower().str());
484 //printf("label='%s' number='%s' => %p\n",qPrint(label),qPrint(number),it->second.get());
485 if (it!=p->entries.end())
486 {
487 it->second->setText(number);
488 it->second->setShortAuthor(shortAuthor);
489 it->second->setYear(year.stripWhiteSpace());
490 }
491 }
492 }
493 if (insideBib) doc+=line+"\n";
494 }
495 //printf("doc=[%s]\n",qPrint(doc));
496 }
497
498 // 7. place formulas back and run the conversion of \f$ ... \f$ to the internal required format
499 {
500 doc = replaceFormulas(doc);
501 Entry current;
502 bool needsEntry = false;
503 CommentScanner commentScanner;
504 int lineNr = 0;
505 int pos = 0;
506 GuardedSectionStack guards;
507 Protection prot = Protection::Public;
508 commentScanner.parseCommentBlock(
509 nullptr,
510 &current,
511 doc, // text
512 fileName(), // file
513 lineNr, // line of block start
514 false, // isBrief
515 false, // isJavaDocStyle
516 false, // isInBody
517 prot, // protection
518 pos, // position,
519 needsEntry,
520 false,
521 &guards
522 );
523 doc = current.doc;
524 }
525
526 // 8. add it as a page
527 addRelatedPage(fileName(),theTranslator->trCiteReferences(),doc,fileName(),1,1);
528
529 // 9. for latex we just copy the bib files to the output and let
530 // latex do this work.
531 if (Config_getBool(GENERATE_LATEX))
532 {
533 // copy bib files to the latex output dir
534 QCString latexOutputDir = Config_getString(LATEX_OUTPUT)+"/";
535 i = 0;
536 for (const auto &bibdata : citeDataList)
537 {
538 QCString bibFile = getBibFile(bibdata);
539 FileInfo fi(bibFile.str());
540 if (fi.exists())
541 {
542 if (!bibFile.isEmpty())
543 {
544 // bug_700510, multiple times the same name were overwriting; creating new names
545 // also for names with spaces
546 ++i;
547 copyFile(bibFile,latexOutputDir + bibTmpFile + QCString().setNum(i) + ".bib");
548 }
549 }
550 else
551 {
552 err("bib file {} not found!\n",bibFile);
553 }
554 }
555 }
556
557 // 10. Remove temporary files
558 if (!citeDebug)
559 {
560 thisDir.remove(citeListFile.str());
561 thisDir.remove(doxygenBstFile.str());
562 thisDir.remove(bib2xhtmlFile.str());
563 // we might try to remove too many files as empty files didn't get a corresponding new file
564 // but the remove function does not emit an error for it and we don't catch the error return
565 // so no problem.
566 for (size_t j = 1; j <= citeDataList.size(); j++)
567 {
568 QCString bibFile = bibOutputDir + bibTmpFile + QCString().setNum(static_cast<int>(j)) + ".bib";
569 thisDir.remove(bibFile.str());
570 }
571 thisDir.rmdir(bibOutputDir.str());
572 }
573}
574
576{
577 QCString result;
578 const StringVector &citeDataList = Config_getList(CITE_BIB_FILES);
579 int i = 0;
580 for (const auto &bibdata : citeDataList)
581 {
582 QCString bibFile = getBibFile(bibdata);
583 FileInfo fi(bibFile.str());
584 if (fi.exists() && !bibFile.isEmpty())
585 {
586 if (i) result += ",";
587 i++;
588 result += bibTmpFile;
589 result += QCString().setNum(i);
590 }
591 }
592 return result;
593}
static QCString getBibFile(const QCString &inFile)
Definition cite.cpp:49
static const std::string g_formulaMarker
Definition cite.cpp:234
const char * bibTmpFile
Definition cite.cpp:36
const char * bibTmpDir
Definition cite.cpp:37
void insertCrossReferencesForBibFile(const QCString &bibFile)
Definition cite.cpp:131
QCString anchorPrefix() const
Definition cite.cpp:126
std::unique_ptr< Private > p
Definition cite.h:123
const CiteInfo * find(const QCString &label) const
Return the citation info for a given label.
Definition cite.cpp:101
QCString latexBibFiles()
lists the bibtex cite files in a comma separated list
Definition cite.cpp:575
static CitationManager & instance()
Definition cite.cpp:85
void clear()
clears the database
Definition cite.cpp:110
QCString replaceFormulas(const QCString &s)
Definition cite.cpp:311
void insert(const QCString &label)
Insert a citation identified by label into the database.
Definition cite.cpp:95
CitationManager()
Create the database, with an expected maximum of size entries.
Definition cite.cpp:91
QCString fileName() const
Definition cite.cpp:121
bool isEmpty() const
return TRUE if there are no citations.
Definition cite.cpp:115
void generatePage()
Generate the citations page.
Definition cite.cpp:331
QCString getFormulas(const QCString &s)
Definition cite.cpp:236
void setText(const QCString &s)
Definition cite.cpp:67
QCString m_label
Definition cite.cpp:72
QCString label() const override
Definition cite.cpp:62
QCString text() const override
Definition cite.cpp:63
QCString m_shortAuthor
Definition cite.cpp:74
QCString year() const override
Definition cite.cpp:65
QCString m_text
Definition cite.cpp:73
QCString m_year
Definition cite.cpp:75
CiteInfoImpl(const QCString &label, const QCString &text=QCString())
Definition cite.cpp:59
QCString shortAuthor() const override
Definition cite.cpp:64
void setYear(const QCString &s)
Definition cite.cpp:69
void setShortAuthor(const QCString &s)
Definition cite.cpp:68
class that provides information about the position of a citation name
Definition cite.cpp:41
QCString fileName
Definition cite.cpp:45
CitePosition(const QCString &fn, int l)
Definition cite.cpp:43
int lineNr
Definition cite.cpp:46
bool parseCommentBlock(OutlineParserInterface *parser, Entry *curEntry, const QCString &comment, const QCString &fileName, int &lineNr, bool isBrief, bool isJavadocStyle, bool isInbody, Protection &prot, int &position, bool &newEntryNeeded, bool markdownEnabled, GuardedSectionStack *guards)
Invokes the comment block parser with the request to parse a single comment block.
@ Cite
Definition debug.h:41
static bool isFlagSet(const DebugMask mask)
Definition debug.cpp:132
Class representing a directory in the file system.
Definition dir.h:75
static std::string currentDirPath()
Definition dir.cpp:342
bool mkdir(const std::string &path, bool acceptsAbsPath=true) const
Definition dir.cpp:295
bool remove(const std::string &path, bool acceptsAbsPath=true) const
Definition dir.cpp:314
bool rmdir(const std::string &path, bool acceptsAbsPath=true) const
Definition dir.cpp:309
static bool setCurrent(const std::string &path)
Definition dir.cpp:350
bool exists() const
Definition dir.cpp:257
Represents an unstructured piece of information, about an entity found in the sources.
Definition entry.h:116
QCString doc
documentation block (partly parsed)
Definition entry.h:200
Minimal replacement for QFileInfo.
Definition fileinfo.h:23
bool exists() const
Definition fileinfo.cpp:30
This is an alternative implementation of QCString.
Definition qcstring.h:101
int find(char c, int index=0, bool cs=TRUE) const
Definition qcstring.cpp:43
size_t length() const
Returns the length of the string, not counting the 0-terminator.
Definition qcstring.h:166
bool startsWith(const char *s) const
Definition qcstring.h:507
QCString mid(size_t index, size_t len=static_cast< size_t >(-1)) const
Definition qcstring.h:241
QCString lower() const
Definition qcstring.h:249
bool endsWith(const char *s) const
Definition qcstring.h:524
bool isEmpty() const
Returns TRUE iff the string is empty.
Definition qcstring.h:163
QCString stripWhiteSpace() const
returns a copy of this string with leading and trailing whitespace removed
Definition qcstring.h:260
const std::string & str() const
Definition qcstring.h:552
QCString & setNum(short n)
Definition qcstring.h:459
QCString right(size_t len) const
Definition qcstring.h:234
void reserve(size_t size)
Reserve space for size bytes without changing the string contents.
Definition qcstring.h:185
const char * data() const
Returns a pointer to the contents of the string in the form of a 0-terminated C string.
Definition qcstring.h:172
QCString left(size_t len) const
Definition qcstring.h:229
void clear()
Definition qcstring.h:182
static ResourceMgr & instance()
Returns the one and only instance of this class.
bool copyResource(const QCString &name, const QCString &targetDir) const
Copies a registered resource to a given target directory.
Interface for the comment block scanner.
std::stack< GuardedSection > GuardedSectionStack
Definition commentscan.h:48
#define Config_getList(name)
Definition config.h:38
#define Config_getBool(name)
Definition config.h:33
#define Config_getString(name)
Definition config.h:32
std::vector< std::string > StringVector
Definition containers.h:33
#define lineCount(s, len)
static void addRelatedPage(Entry *root)
Definition doxygen.cpp:328
Translator * theTranslator
Definition language.cpp:71
#define warn(file, line, fmt,...)
Definition message.h:97
#define err(fmt,...)
Definition message.h:127
std::ifstream openInputStream(const QCString &name, bool binary=false, bool openAtEnd=false)
Definition portable.cpp:660
std::ofstream openOutputStream(const QCString &name, bool append=false)
Definition portable.cpp:649
int system(const QCString &command, const QCString &args, bool commandHasConsole=true)
Definition portable.cpp:106
Portable versions of functions that are platform dependent.
#define qsnprintf
Definition qcstring.h:49
#define TRUE
Definition qcstring.h:37
#define FALSE
Definition qcstring.h:34
std::map< std::string, std::unique_ptr< CiteInfoImpl > > entries
Definition cite.cpp:80
std::unordered_map< std::string, CitePosition > citePosition
Definition cite.cpp:82
std::unordered_map< int, std::string > formulaCite
Definition cite.cpp:81
Citation-related data.
Definition cite.h:70
Protection
Definition types.h:32
StringVector split(const std::string &s, const std::string &delimiter)
split input string s by string delimiter delimiter.
Definition util.cpp:6568
bool copyFile(const QCString &src, const QCString &dest)
Copies the contents of file with name src to the newly created file with name dest.
Definition util.cpp:5809
A bunch of utility functions.