//===--- CommentSema.cpp - Doxygen comment semantic analysis --------------===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// #include "clang/AST/CommentSema.h" #include "clang/AST/CommentDiagnostic.h" #include "clang/AST/CommentCommandTraits.h" #include "clang/AST/Decl.h" #include "clang/AST/DeclTemplate.h" #include "clang/Basic/SourceManager.h" #include "llvm/ADT/StringSwitch.h" namespace clang { namespace comments { namespace { #include "clang/AST/CommentHTMLTagsProperties.inc" } // unnamed namespace Sema::Sema(llvm::BumpPtrAllocator &Allocator, const SourceManager &SourceMgr, DiagnosticsEngine &Diags, CommandTraits &Traits) : Allocator(Allocator), SourceMgr(SourceMgr), Diags(Diags), Traits(Traits), ThisDeclInfo(NULL), BriefCommand(NULL), ReturnsCommand(NULL) { } void Sema::setDecl(const Decl *D) { if (!D) return; ThisDeclInfo = new (Allocator) DeclInfo; ThisDeclInfo->ThisDecl = D; ThisDeclInfo->IsFilled = false; } ParagraphComment *Sema::actOnParagraphComment( ArrayRef Content) { return new (Allocator) ParagraphComment(Content); } BlockCommandComment *Sema::actOnBlockCommandStart(SourceLocation LocBegin, SourceLocation LocEnd, unsigned CommandID) { return new (Allocator) BlockCommandComment(LocBegin, LocEnd, CommandID); } void Sema::actOnBlockCommandArgs(BlockCommandComment *Command, ArrayRef Args) { Command->setArgs(Args); } void Sema::actOnBlockCommandFinish(BlockCommandComment *Command, ParagraphComment *Paragraph) { Command->setParagraph(Paragraph); checkBlockCommandEmptyParagraph(Command); checkBlockCommandDuplicate(Command); checkReturnsCommand(Command); } ParamCommandComment *Sema::actOnParamCommandStart(SourceLocation LocBegin, SourceLocation LocEnd, unsigned CommandID) { ParamCommandComment *Command = new (Allocator) ParamCommandComment(LocBegin, LocEnd, CommandID); if (!isFunctionDecl()) Diag(Command->getLocation(), diag::warn_doc_param_not_attached_to_a_function_decl) << Command->getCommandNameRange(Traits); return Command; } void Sema::actOnParamCommandDirectionArg(ParamCommandComment *Command, SourceLocation ArgLocBegin, SourceLocation ArgLocEnd, StringRef Arg) { ParamCommandComment::PassDirection Direction; std::string ArgLower = Arg.lower(); // TODO: optimize: lower Name first (need an API in SmallString for that), // after that StringSwitch. if (ArgLower == "[in]") Direction = ParamCommandComment::In; else if (ArgLower == "[out]") Direction = ParamCommandComment::Out; else if (ArgLower == "[in,out]" || ArgLower == "[out,in]") Direction = ParamCommandComment::InOut; else { // Remove spaces. std::string::iterator O = ArgLower.begin(); for (std::string::iterator I = ArgLower.begin(), E = ArgLower.end(); I != E; ++I) { const char C = *I; if (C != ' ' && C != '\n' && C != '\r' && C != '\t' && C != '\v' && C != '\f') *O++ = C; } ArgLower.resize(O - ArgLower.begin()); bool RemovingWhitespaceHelped = false; if (ArgLower == "[in]") { Direction = ParamCommandComment::In; RemovingWhitespaceHelped = true; } else if (ArgLower == "[out]") { Direction = ParamCommandComment::Out; RemovingWhitespaceHelped = true; } else if (ArgLower == "[in,out]" || ArgLower == "[out,in]") { Direction = ParamCommandComment::InOut; RemovingWhitespaceHelped = true; } else { Direction = ParamCommandComment::In; RemovingWhitespaceHelped = false; } SourceRange ArgRange(ArgLocBegin, ArgLocEnd); if (RemovingWhitespaceHelped) Diag(ArgLocBegin, diag::warn_doc_param_spaces_in_direction) << ArgRange << FixItHint::CreateReplacement( ArgRange, ParamCommandComment::getDirectionAsString(Direction)); else Diag(ArgLocBegin, diag::warn_doc_param_invalid_direction) << ArgRange; } Command->setDirection(Direction, /* Explicit = */ true); } void Sema::actOnParamCommandParamNameArg(ParamCommandComment *Command, SourceLocation ArgLocBegin, SourceLocation ArgLocEnd, StringRef Arg) { // Parser will not feed us more arguments than needed. assert(Command->getNumArgs() == 0); if (!Command->isDirectionExplicit()) { // User didn't provide a direction argument. Command->setDirection(ParamCommandComment::In, /* Explicit = */ false); } typedef BlockCommandComment::Argument Argument; Argument *A = new (Allocator) Argument(SourceRange(ArgLocBegin, ArgLocEnd), Arg); Command->setArgs(llvm::makeArrayRef(A, 1)); } void Sema::actOnParamCommandFinish(ParamCommandComment *Command, ParagraphComment *Paragraph) { Command->setParagraph(Paragraph); checkBlockCommandEmptyParagraph(Command); } TParamCommandComment *Sema::actOnTParamCommandStart(SourceLocation LocBegin, SourceLocation LocEnd, unsigned CommandID) { TParamCommandComment *Command = new (Allocator) TParamCommandComment(LocBegin, LocEnd, CommandID); if (!isTemplateOrSpecialization()) Diag(Command->getLocation(), diag::warn_doc_tparam_not_attached_to_a_template_decl) << Command->getCommandNameRange(Traits); return Command; } void Sema::actOnTParamCommandParamNameArg(TParamCommandComment *Command, SourceLocation ArgLocBegin, SourceLocation ArgLocEnd, StringRef Arg) { // Parser will not feed us more arguments than needed. assert(Command->getNumArgs() == 0); typedef BlockCommandComment::Argument Argument; Argument *A = new (Allocator) Argument(SourceRange(ArgLocBegin, ArgLocEnd), Arg); Command->setArgs(llvm::makeArrayRef(A, 1)); if (!isTemplateOrSpecialization()) { // We already warned that this \\tparam is not attached to a template decl. return; } const TemplateParameterList *TemplateParameters = ThisDeclInfo->TemplateParameters; SmallVector Position; if (resolveTParamReference(Arg, TemplateParameters, &Position)) { Command->setPosition(copyArray(llvm::makeArrayRef(Position))); llvm::StringMap::iterator PrevCommandIt = TemplateParameterDocs.find(Arg); if (PrevCommandIt != TemplateParameterDocs.end()) { SourceRange ArgRange(ArgLocBegin, ArgLocEnd); Diag(ArgLocBegin, diag::warn_doc_tparam_duplicate) << Arg << ArgRange; TParamCommandComment *PrevCommand = PrevCommandIt->second; Diag(PrevCommand->getLocation(), diag::note_doc_tparam_previous) << PrevCommand->getParamNameRange(); } TemplateParameterDocs[Arg] = Command; return; } SourceRange ArgRange(ArgLocBegin, ArgLocEnd); Diag(ArgLocBegin, diag::warn_doc_tparam_not_found) << Arg << ArgRange; if (!TemplateParameters || TemplateParameters->size() == 0) return; StringRef CorrectedName; if (TemplateParameters->size() == 1) { const NamedDecl *Param = TemplateParameters->getParam(0); const IdentifierInfo *II = Param->getIdentifier(); if (II) CorrectedName = II->getName(); } else { CorrectedName = correctTypoInTParamReference(Arg, TemplateParameters); } if (!CorrectedName.empty()) { Diag(ArgLocBegin, diag::note_doc_tparam_name_suggestion) << CorrectedName << FixItHint::CreateReplacement(ArgRange, CorrectedName); } return; } void Sema::actOnTParamCommandFinish(TParamCommandComment *Command, ParagraphComment *Paragraph) { Command->setParagraph(Paragraph); checkBlockCommandEmptyParagraph(Command); } InlineCommandComment *Sema::actOnInlineCommand(SourceLocation CommandLocBegin, SourceLocation CommandLocEnd, unsigned CommandID) { ArrayRef Args; StringRef CommandName = Traits.getCommandInfo(CommandID)->Name; return new (Allocator) InlineCommandComment( CommandLocBegin, CommandLocEnd, CommandID, getInlineCommandRenderKind(CommandName), Args); } InlineCommandComment *Sema::actOnInlineCommand(SourceLocation CommandLocBegin, SourceLocation CommandLocEnd, unsigned CommandID, SourceLocation ArgLocBegin, SourceLocation ArgLocEnd, StringRef Arg) { typedef InlineCommandComment::Argument Argument; Argument *A = new (Allocator) Argument(SourceRange(ArgLocBegin, ArgLocEnd), Arg); StringRef CommandName = Traits.getCommandInfo(CommandID)->Name; return new (Allocator) InlineCommandComment( CommandLocBegin, CommandLocEnd, CommandID, getInlineCommandRenderKind(CommandName), llvm::makeArrayRef(A, 1)); } InlineContentComment *Sema::actOnUnknownCommand(SourceLocation LocBegin, SourceLocation LocEnd, StringRef Name) { ArrayRef Args; unsigned CommandID = Traits.registerUnknownCommand(Name)->getID(); return new (Allocator) InlineCommandComment( LocBegin, LocEnd, CommandID, InlineCommandComment::RenderNormal, Args); } TextComment *Sema::actOnText(SourceLocation LocBegin, SourceLocation LocEnd, StringRef Text) { return new (Allocator) TextComment(LocBegin, LocEnd, Text); } VerbatimBlockComment *Sema::actOnVerbatimBlockStart(SourceLocation Loc, unsigned CommandID) { StringRef CommandName = Traits.getCommandInfo(CommandID)->Name; return new (Allocator) VerbatimBlockComment( Loc, Loc.getLocWithOffset(1 + CommandName.size()), CommandID); } VerbatimBlockLineComment *Sema::actOnVerbatimBlockLine(SourceLocation Loc, StringRef Text) { return new (Allocator) VerbatimBlockLineComment(Loc, Text); } void Sema::actOnVerbatimBlockFinish( VerbatimBlockComment *Block, SourceLocation CloseNameLocBegin, StringRef CloseName, ArrayRef Lines) { Block->setCloseName(CloseName, CloseNameLocBegin); Block->setLines(Lines); } VerbatimLineComment *Sema::actOnVerbatimLine(SourceLocation LocBegin, unsigned CommandID, SourceLocation TextBegin, StringRef Text) { return new (Allocator) VerbatimLineComment( LocBegin, TextBegin.getLocWithOffset(Text.size()), CommandID, TextBegin, Text); } HTMLStartTagComment *Sema::actOnHTMLStartTagStart(SourceLocation LocBegin, StringRef TagName) { return new (Allocator) HTMLStartTagComment(LocBegin, TagName); } void Sema::actOnHTMLStartTagFinish( HTMLStartTagComment *Tag, ArrayRef Attrs, SourceLocation GreaterLoc, bool IsSelfClosing) { Tag->setAttrs(Attrs); Tag->setGreaterLoc(GreaterLoc); if (IsSelfClosing) Tag->setSelfClosing(); else if (!isHTMLEndTagForbidden(Tag->getTagName())) HTMLOpenTags.push_back(Tag); } HTMLEndTagComment *Sema::actOnHTMLEndTag(SourceLocation LocBegin, SourceLocation LocEnd, StringRef TagName) { HTMLEndTagComment *HET = new (Allocator) HTMLEndTagComment(LocBegin, LocEnd, TagName); if (isHTMLEndTagForbidden(TagName)) { Diag(HET->getLocation(), diag::warn_doc_html_end_forbidden) << TagName << HET->getSourceRange(); return HET; } bool FoundOpen = false; for (SmallVectorImpl::const_reverse_iterator I = HTMLOpenTags.rbegin(), E = HTMLOpenTags.rend(); I != E; ++I) { if ((*I)->getTagName() == TagName) { FoundOpen = true; break; } } if (!FoundOpen) { Diag(HET->getLocation(), diag::warn_doc_html_end_unbalanced) << HET->getSourceRange(); return HET; } while (!HTMLOpenTags.empty()) { const HTMLStartTagComment *HST = HTMLOpenTags.back(); HTMLOpenTags.pop_back(); StringRef LastNotClosedTagName = HST->getTagName(); if (LastNotClosedTagName == TagName) break; if (isHTMLEndTagOptional(LastNotClosedTagName)) continue; bool OpenLineInvalid; const unsigned OpenLine = SourceMgr.getPresumedLineNumber( HST->getLocation(), &OpenLineInvalid); bool CloseLineInvalid; const unsigned CloseLine = SourceMgr.getPresumedLineNumber( HET->getLocation(), &CloseLineInvalid); if (OpenLineInvalid || CloseLineInvalid || OpenLine == CloseLine) Diag(HST->getLocation(), diag::warn_doc_html_start_end_mismatch) << HST->getTagName() << HET->getTagName() << HST->getSourceRange() << HET->getSourceRange(); else { Diag(HST->getLocation(), diag::warn_doc_html_start_end_mismatch) << HST->getTagName() << HET->getTagName() << HST->getSourceRange(); Diag(HET->getLocation(), diag::note_doc_html_end_tag) << HET->getSourceRange(); } } return HET; } FullComment *Sema::actOnFullComment( ArrayRef Blocks) { FullComment *FC = new (Allocator) FullComment(Blocks, ThisDeclInfo); resolveParamCommandIndexes(FC); return FC; } void Sema::checkBlockCommandEmptyParagraph(BlockCommandComment *Command) { ParagraphComment *Paragraph = Command->getParagraph(); if (Paragraph->isWhitespace()) { SourceLocation DiagLoc; if (Command->getNumArgs() > 0) DiagLoc = Command->getArgRange(Command->getNumArgs() - 1).getEnd(); if (!DiagLoc.isValid()) DiagLoc = Command->getCommandNameRange(Traits).getEnd(); Diag(DiagLoc, diag::warn_doc_block_command_empty_paragraph) << Command->getCommandName(Traits) << Command->getSourceRange(); } } void Sema::checkReturnsCommand(const BlockCommandComment *Command) { if (!Traits.getCommandInfo(Command->getCommandID())->IsReturnsCommand) return; if (isFunctionDecl()) { if (ThisDeclInfo->ResultType->isVoidType()) { unsigned DiagKind; switch (ThisDeclInfo->ThisDecl->getKind()) { default: if (ThisDeclInfo->IsObjCMethod) DiagKind = 3; else DiagKind = 0; break; case Decl::CXXConstructor: DiagKind = 1; break; case Decl::CXXDestructor: DiagKind = 2; break; } Diag(Command->getLocation(), diag::warn_doc_returns_attached_to_a_void_function) << Command->getCommandName(Traits) << DiagKind << Command->getSourceRange(); } return; } Diag(Command->getLocation(), diag::warn_doc_returns_not_attached_to_a_function_decl) << Command->getCommandName(Traits) << Command->getSourceRange(); } void Sema::checkBlockCommandDuplicate(const BlockCommandComment *Command) { const CommandInfo *Info = Traits.getCommandInfo(Command->getCommandID()); const BlockCommandComment *PrevCommand = NULL; if (Info->IsBriefCommand) { if (!BriefCommand) { BriefCommand = Command; return; } PrevCommand = BriefCommand; } else if (Info->IsReturnsCommand) { if (!ReturnsCommand) { ReturnsCommand = Command; return; } PrevCommand = ReturnsCommand; } else { // We don't want to check this command for duplicates. return; } StringRef CommandName = Command->getCommandName(Traits); StringRef PrevCommandName = PrevCommand->getCommandName(Traits); Diag(Command->getLocation(), diag::warn_doc_block_command_duplicate) << CommandName << Command->getSourceRange(); if (CommandName == PrevCommandName) Diag(PrevCommand->getLocation(), diag::note_doc_block_command_previous) << PrevCommandName << PrevCommand->getSourceRange(); else Diag(PrevCommand->getLocation(), diag::note_doc_block_command_previous_alias) << PrevCommandName << CommandName; } void Sema::resolveParamCommandIndexes(const FullComment *FC) { if (!isFunctionDecl()) { // We already warned that \\param commands are not attached to a function // decl. return; } llvm::SmallVector UnresolvedParamCommands; // Comment AST nodes that correspond to \c ParamVars for which we have // found a \\param command or NULL if no documentation was found so far. llvm::SmallVector ParamVarDocs; ArrayRef ParamVars = getParamVars(); ParamVarDocs.resize(ParamVars.size(), NULL); // First pass over all \\param commands: resolve all parameter names. for (Comment::child_iterator I = FC->child_begin(), E = FC->child_end(); I != E; ++I) { ParamCommandComment *PCC = dyn_cast(*I); if (!PCC || !PCC->hasParamName()) continue; StringRef ParamName = PCC->getParamName(); // Check that referenced parameter name is in the function decl. const unsigned ResolvedParamIndex = resolveParmVarReference(ParamName, ParamVars); if (ResolvedParamIndex == ParamCommandComment::InvalidParamIndex) { UnresolvedParamCommands.push_back(PCC); continue; } PCC->setParamIndex(ResolvedParamIndex); if (ParamVarDocs[ResolvedParamIndex]) { SourceRange ArgRange = PCC->getParamNameRange(); Diag(ArgRange.getBegin(), diag::warn_doc_param_duplicate) << ParamName << ArgRange; ParamCommandComment *PrevCommand = ParamVarDocs[ResolvedParamIndex]; Diag(PrevCommand->getLocation(), diag::note_doc_param_previous) << PrevCommand->getParamNameRange(); } ParamVarDocs[ResolvedParamIndex] = PCC; } // Find parameter declarations that have no corresponding \\param. llvm::SmallVector OrphanedParamDecls; for (unsigned i = 0, e = ParamVarDocs.size(); i != e; ++i) { if (!ParamVarDocs[i]) OrphanedParamDecls.push_back(ParamVars[i]); } // Second pass over unresolved \\param commands: do typo correction. // Suggest corrections from a set of parameter declarations that have no // corresponding \\param. for (unsigned i = 0, e = UnresolvedParamCommands.size(); i != e; ++i) { const ParamCommandComment *PCC = UnresolvedParamCommands[i]; SourceRange ArgRange = PCC->getParamNameRange(); StringRef ParamName = PCC->getParamName(); Diag(ArgRange.getBegin(), diag::warn_doc_param_not_found) << ParamName << ArgRange; // All parameters documented -- can't suggest a correction. if (OrphanedParamDecls.size() == 0) continue; unsigned CorrectedParamIndex = ParamCommandComment::InvalidParamIndex; if (OrphanedParamDecls.size() == 1) { // If one parameter is not documented then that parameter is the only // possible suggestion. CorrectedParamIndex = 0; } else { // Do typo correction. CorrectedParamIndex = correctTypoInParmVarReference(ParamName, OrphanedParamDecls); } if (CorrectedParamIndex != ParamCommandComment::InvalidParamIndex) { const ParmVarDecl *CorrectedPVD = OrphanedParamDecls[CorrectedParamIndex]; if (const IdentifierInfo *CorrectedII = CorrectedPVD->getIdentifier()) Diag(ArgRange.getBegin(), diag::note_doc_param_name_suggestion) << CorrectedII->getName() << FixItHint::CreateReplacement(ArgRange, CorrectedII->getName()); } } } bool Sema::isFunctionDecl() { if (!ThisDeclInfo) return false; if (!ThisDeclInfo->IsFilled) inspectThisDecl(); return ThisDeclInfo->getKind() == DeclInfo::FunctionKind; } bool Sema::isTemplateOrSpecialization() { if (!ThisDeclInfo) return false; if (!ThisDeclInfo->IsFilled) inspectThisDecl(); return ThisDeclInfo->getTemplateKind() != DeclInfo::NotTemplate; } ArrayRef Sema::getParamVars() { if (!ThisDeclInfo->IsFilled) inspectThisDecl(); return ThisDeclInfo->ParamVars; } void Sema::inspectThisDecl() { ThisDeclInfo->fill(); } unsigned Sema::resolveParmVarReference(StringRef Name, ArrayRef ParamVars) { for (unsigned i = 0, e = ParamVars.size(); i != e; ++i) { const IdentifierInfo *II = ParamVars[i]->getIdentifier(); if (II && II->getName() == Name) return i; } return ParamCommandComment::InvalidParamIndex; } namespace { class SimpleTypoCorrector { StringRef Typo; const unsigned MaxEditDistance; const NamedDecl *BestDecl; unsigned BestEditDistance; unsigned BestIndex; unsigned NextIndex; public: SimpleTypoCorrector(StringRef Typo) : Typo(Typo), MaxEditDistance((Typo.size() + 2) / 3), BestDecl(NULL), BestEditDistance(MaxEditDistance + 1), BestIndex(0), NextIndex(0) { } void addDecl(const NamedDecl *ND); const NamedDecl *getBestDecl() const { if (BestEditDistance > MaxEditDistance) return NULL; return BestDecl; } unsigned getBestDeclIndex() const { assert(getBestDecl()); return BestIndex; } }; void SimpleTypoCorrector::addDecl(const NamedDecl *ND) { unsigned CurrIndex = NextIndex++; const IdentifierInfo *II = ND->getIdentifier(); if (!II) return; StringRef Name = II->getName(); unsigned MinPossibleEditDistance = abs((int)Name.size() - (int)Typo.size()); if (MinPossibleEditDistance > 0 && Typo.size() / MinPossibleEditDistance < 3) return; unsigned EditDistance = Typo.edit_distance(Name, true, MaxEditDistance); if (EditDistance < BestEditDistance) { BestEditDistance = EditDistance; BestDecl = ND; BestIndex = CurrIndex; } } } // unnamed namespace unsigned Sema::correctTypoInParmVarReference( StringRef Typo, ArrayRef ParamVars) { SimpleTypoCorrector Corrector(Typo); for (unsigned i = 0, e = ParamVars.size(); i != e; ++i) Corrector.addDecl(ParamVars[i]); if (Corrector.getBestDecl()) return Corrector.getBestDeclIndex(); else return ParamCommandComment::InvalidParamIndex; } namespace { bool ResolveTParamReferenceHelper( StringRef Name, const TemplateParameterList *TemplateParameters, SmallVectorImpl *Position) { for (unsigned i = 0, e = TemplateParameters->size(); i != e; ++i) { const NamedDecl *Param = TemplateParameters->getParam(i); const IdentifierInfo *II = Param->getIdentifier(); if (II && II->getName() == Name) { Position->push_back(i); return true; } if (const TemplateTemplateParmDecl *TTP = dyn_cast(Param)) { Position->push_back(i); if (ResolveTParamReferenceHelper(Name, TTP->getTemplateParameters(), Position)) return true; Position->pop_back(); } } return false; } } // unnamed namespace bool Sema::resolveTParamReference( StringRef Name, const TemplateParameterList *TemplateParameters, SmallVectorImpl *Position) { Position->clear(); if (!TemplateParameters) return false; return ResolveTParamReferenceHelper(Name, TemplateParameters, Position); } namespace { void CorrectTypoInTParamReferenceHelper( const TemplateParameterList *TemplateParameters, SimpleTypoCorrector &Corrector) { for (unsigned i = 0, e = TemplateParameters->size(); i != e; ++i) { const NamedDecl *Param = TemplateParameters->getParam(i); Corrector.addDecl(Param); if (const TemplateTemplateParmDecl *TTP = dyn_cast(Param)) CorrectTypoInTParamReferenceHelper(TTP->getTemplateParameters(), Corrector); } } } // unnamed namespace StringRef Sema::correctTypoInTParamReference( StringRef Typo, const TemplateParameterList *TemplateParameters) { SimpleTypoCorrector Corrector(Typo); CorrectTypoInTParamReferenceHelper(TemplateParameters, Corrector); if (const NamedDecl *ND = Corrector.getBestDecl()) { const IdentifierInfo *II = ND->getIdentifier(); assert(II && "SimpleTypoCorrector should not return this decl"); return II->getName(); } return StringRef(); } InlineCommandComment::RenderKind Sema::getInlineCommandRenderKind(StringRef Name) const { assert(Traits.getCommandInfo(Name)->IsInlineCommand); return llvm::StringSwitch(Name) .Case("b", InlineCommandComment::RenderBold) .Cases("c", "p", InlineCommandComment::RenderMonospaced) .Cases("a", "e", "em", InlineCommandComment::RenderEmphasized) .Default(InlineCommandComment::RenderNormal); } } // end namespace comments } // end namespace clang