• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 //===--- Format.h - Format C++ code -----------------------------*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 ///
10 /// \file
11 /// Various functions to configurably format source code.
12 ///
13 //===----------------------------------------------------------------------===//
14 
15 #ifndef LLVM_CLANG_FORMAT_FORMAT_H
16 #define LLVM_CLANG_FORMAT_FORMAT_H
17 
18 #include "clang/Frontend/FrontendAction.h"
19 #include "clang/Tooling/Refactoring.h"
20 #include <system_error>
21 
22 namespace clang {
23 
24 class Lexer;
25 class SourceManager;
26 class DiagnosticConsumer;
27 
28 namespace format {
29 
30 enum class ParseError { Success = 0, Error, Unsuitable };
31 class ParseErrorCategory final : public std::error_category {
32 public:
33   const char *name() const LLVM_NOEXCEPT override;
34   std::string message(int EV) const override;
35 };
36 const std::error_category &getParseCategory();
37 std::error_code make_error_code(ParseError e);
38 
39 /// \brief The \c FormatStyle is used to configure the formatting to follow
40 /// specific guidelines.
41 struct FormatStyle {
42   /// \brief Supported languages. When stored in a configuration file, specifies
43   /// the language, that the configuration targets. When passed to the
44   /// reformat() function, enables syntax features specific to the language.
45   enum LanguageKind {
46     /// Do not use.
47     LK_None,
48     /// Should be used for C, C++, ObjectiveC, ObjectiveC++.
49     LK_Cpp,
50     /// Should be used for JavaScript.
51     LK_JavaScript,
52     /// Should be used for Protocol Buffers
53     /// (https://developers.google.com/protocol-buffers/).
54     LK_Proto
55   };
56 
57   /// \brief Language, this format style is targeted at.
58   LanguageKind Language;
59 
60   /// \brief The column limit.
61   ///
62   /// A column limit of \c 0 means that there is no column limit. In this case,
63   /// clang-format will respect the input's line breaking decisions within
64   /// statements unless they contradict other rules.
65   unsigned ColumnLimit;
66 
67   /// \brief The maximum number of consecutive empty lines to keep.
68   unsigned MaxEmptyLinesToKeep;
69 
70   /// \brief If true, empty lines at the start of blocks are kept.
71   bool KeepEmptyLinesAtTheStartOfBlocks;
72 
73   /// \brief The penalty for each line break introduced inside a comment.
74   unsigned PenaltyBreakComment;
75 
76   /// \brief The penalty for each line break introduced inside a string literal.
77   unsigned PenaltyBreakString;
78 
79   /// \brief The penalty for each character outside of the column limit.
80   unsigned PenaltyExcessCharacter;
81 
82   /// \brief The penalty for breaking before the first \c <<.
83   unsigned PenaltyBreakFirstLessLess;
84 
85   /// \brief The penalty for breaking a function call after "call(".
86   unsigned PenaltyBreakBeforeFirstCallParameter;
87 
88   /// \brief The & and * alignment style.
89   enum PointerAlignmentStyle {
90     /// Align pointer to the left.
91     PAS_Left,
92     /// Align pointer to the right.
93     PAS_Right,
94     /// Align pointer in the middle.
95     PAS_Middle
96   };
97 
98   /// Pointer and reference alignment style.
99   PointerAlignmentStyle PointerAlignment;
100 
101   /// \brief If \c true, analyze the formatted file for the most common
102   /// alignment of & and *. \c PointerAlignment is then used only as fallback.
103   bool DerivePointerAlignment;
104 
105   /// \brief The extra indent or outdent of access modifiers, e.g. \c public:.
106   int AccessModifierOffset;
107 
108   /// \brief Supported language standards.
109   enum LanguageStandard {
110     /// Use C++03-compatible syntax.
111     LS_Cpp03,
112     /// Use features of C++11 (e.g. \c A<A<int>> instead of
113     /// <tt>A<A<int> ></tt>).
114     LS_Cpp11,
115     /// Automatic detection based on the input.
116     LS_Auto
117   };
118 
119   /// \brief Format compatible with this standard, e.g. use
120   /// <tt>A<A<int> ></tt> instead of \c A<A<int>> for LS_Cpp03.
121   LanguageStandard Standard;
122 
123   /// \brief Indent case labels one level from the switch statement.
124   ///
125   /// When \c false, use the same indentation level as for the switch statement.
126   /// Switch statement body is always indented one level more than case labels.
127   bool IndentCaseLabels;
128 
129   /// \brief Indent if a function definition or declaration is wrapped after the
130   /// type.
131   bool IndentWrappedFunctionNames;
132 
133   /// \brief Different ways to indent namespace contents.
134   enum NamespaceIndentationKind {
135     /// Don't indent in namespaces.
136     NI_None,
137     /// Indent only in inner namespaces (nested in other namespaces).
138     NI_Inner,
139     /// Indent in all namespaces.
140     NI_All
141   };
142 
143   /// \brief The indentation used for namespaces.
144   NamespaceIndentationKind NamespaceIndentation;
145 
146   /// \brief The number of spaces before trailing line comments
147   /// (\c // - comments).
148   ///
149   /// This does not affect trailing block comments (\c /**/ - comments) as those
150   /// commonly have different usage patterns and a number of special cases.
151   unsigned SpacesBeforeTrailingComments;
152 
153   /// \brief If \c false, a function call's or function definition's parameters
154   /// will either all be on the same line or will have one line each.
155   bool BinPackParameters;
156 
157   /// \brief If \c true, clang-format detects whether function calls and
158   /// definitions are formatted with one parameter per line.
159   ///
160   /// Each call can be bin-packed, one-per-line or inconclusive. If it is
161   /// inconclusive, e.g. completely on one line, but a decision needs to be
162   /// made, clang-format analyzes whether there are other bin-packed cases in
163   /// the input file and act accordingly.
164   ///
165   /// NOTE: This is an experimental flag, that might go away or be renamed. Do
166   /// not use this in config files, etc. Use at your own risk.
167   bool ExperimentalAutoDetectBinPacking;
168 
169   /// \brief Allow putting all parameters of a function declaration onto
170   /// the next line even if \c BinPackParameters is \c false.
171   bool AllowAllParametersOfDeclarationOnNextLine;
172 
173   /// \brief Penalty for putting the return type of a function onto its own
174   /// line.
175   unsigned PenaltyReturnTypeOnItsOwnLine;
176 
177   /// \brief If the constructor initializers don't fit on a line, put each
178   /// initializer on its own line.
179   bool ConstructorInitializerAllOnOneLineOrOnePerLine;
180 
181   /// \brief Always break constructor initializers before commas and align
182   /// the commas with the colon.
183   bool BreakConstructorInitializersBeforeComma;
184 
185   /// \brief Allows contracting simple braced statements to a single line.
186   ///
187   /// E.g., this allows <tt>if (a) { return; }</tt> to be put on a single line.
188   bool AllowShortBlocksOnASingleLine;
189 
190   /// \brief If \c true, <tt>if (a) return;</tt> can be put on a single
191   /// line.
192   bool AllowShortIfStatementsOnASingleLine;
193 
194   /// \brief If \c true, <tt>while (true) continue;</tt> can be put on a
195   /// single line.
196   bool AllowShortLoopsOnASingleLine;
197 
198   /// \brief Different styles for merging short functions containing at most one
199   /// statement.
200   enum ShortFunctionStyle {
201     /// \brief Never merge functions into a single line.
202     SFS_None,
203     /// \brief Only merge functions defined inside a class.
204     SFS_Inline,
205     /// \brief Merge all functions fitting on a single line.
206     SFS_All,
207   };
208 
209   /// \brief Dependent on the value, <tt>int f() { return 0; }</tt> can be put
210   /// on a single line.
211   ShortFunctionStyle AllowShortFunctionsOnASingleLine;
212 
213   /// \brief Add a space after \c @property in Objective-C, i.e. use
214   /// <tt>\@property (readonly)</tt> instead of <tt>\@property(readonly)</tt>.
215   bool ObjCSpaceAfterProperty;
216 
217   /// \brief Add a space in front of an Objective-C protocol list, i.e. use
218   /// <tt>Foo <Protocol></tt> instead of \c Foo<Protocol>.
219   bool ObjCSpaceBeforeProtocolList;
220 
221   /// \brief If \c true, aligns trailing comments.
222   bool AlignTrailingComments;
223 
224   /// \brief If \c true, aligns escaped newlines as far left as possible.
225   /// Otherwise puts them into the right-most column.
226   bool AlignEscapedNewlinesLeft;
227 
228   /// \brief The number of columns to use for indentation.
229   unsigned IndentWidth;
230 
231   /// \brief The number of columns used for tab stops.
232   unsigned TabWidth;
233 
234   /// \brief The number of characters to use for indentation of constructor
235   /// initializer lists.
236   unsigned ConstructorInitializerIndentWidth;
237 
238   /// \brief If \c true, always break after the <tt>template<...></tt> of a
239   /// template declaration.
240   bool AlwaysBreakTemplateDeclarations;
241 
242   /// \brief If \c true, always break before multiline string literals.
243   bool AlwaysBreakBeforeMultilineStrings;
244 
245   /// \brief Different ways to use tab in formatting.
246   enum UseTabStyle {
247     /// Never use tab.
248     UT_Never,
249     /// Use tabs only for indentation.
250     UT_ForIndentation,
251     /// Use tabs whenever we need to fill whitespace that spans at least from
252     /// one tab stop to the next one.
253     UT_Always
254   };
255 
256   /// \brief The way to use tab characters in the resulting file.
257   UseTabStyle UseTab;
258 
259   /// \brief If \c true, binary operators will be placed after line breaks.
260   bool BreakBeforeBinaryOperators;
261 
262   /// \brief If \c true, ternary operators will be placed after line breaks.
263   bool BreakBeforeTernaryOperators;
264 
265   /// \brief Different ways to attach braces to their surrounding context.
266   enum BraceBreakingStyle {
267     /// Always attach braces to surrounding context.
268     BS_Attach,
269     /// Like \c Attach, but break before braces on function, namespace and
270     /// class definitions.
271     BS_Linux,
272     /// Like \c Attach, but break before function definitions.
273     BS_Stroustrup,
274     /// Always break before braces.
275     BS_Allman,
276     /// Always break before braces and add an extra level of indentation to
277     /// braces of control statements, not to those of class, function
278     /// or other definitions.
279     BS_GNU
280   };
281 
282   /// \brief The brace breaking style to use.
283   BraceBreakingStyle BreakBeforeBraces;
284 
285   /// \brief If \c true, format braced lists as best suited for C++11 braced
286   /// lists.
287   ///
288   /// Important differences:
289   /// - No spaces inside the braced list.
290   /// - No line break before the closing brace.
291   /// - Indentation with the continuation indent, not with the block indent.
292   ///
293   /// Fundamentally, C++11 braced lists are formatted exactly like function
294   /// calls would be formatted in their place. If the braced list follows a name
295   /// (e.g. a type or variable name), clang-format formats as if the \c {} were
296   /// the parentheses of a function call with that name. If there is no name,
297   /// a zero-length name is assumed.
298   bool Cpp11BracedListStyle;
299 
300   /// \brief If \c true, spaces will be inserted after '(' and before ')'.
301   bool SpacesInParentheses;
302 
303   /// \brief If \c true, spaces will be inserted after '<' and before '>' in
304   /// template argument lists
305   bool SpacesInAngles;
306 
307   /// \brief If \c true, spaces may be inserted into '()'.
308   bool SpaceInEmptyParentheses;
309 
310   /// \brief If \c true, spaces are inserted inside container literals (e.g.
311   /// ObjC and Javascript array and dict literals).
312   bool SpacesInContainerLiterals;
313 
314   /// \brief If \c true, spaces may be inserted into C style casts.
315   bool SpacesInCStyleCastParentheses;
316 
317   /// \brief Different ways to put a space before opening parentheses.
318   enum SpaceBeforeParensOptions {
319     /// Never put a space before opening parentheses.
320     SBPO_Never,
321     /// Put a space before opening parentheses only after control statement
322     /// keywords (<tt>for/if/while...</tt>).
323     SBPO_ControlStatements,
324     /// Always put a space before opening parentheses, except when it's
325     /// prohibited by the syntax rules (in function-like macro definitions) or
326     /// when determined by other style rules (after unary operators, opening
327     /// parentheses, etc.)
328     SBPO_Always
329   };
330 
331   /// \brief Defines in which cases to put a space before opening parentheses.
332   SpaceBeforeParensOptions SpaceBeforeParens;
333 
334   /// \brief If \c false, spaces will be removed before assignment operators.
335   bool SpaceBeforeAssignmentOperators;
336 
337   /// \brief Indent width for line continuations.
338   unsigned ContinuationIndentWidth;
339 
340   /// \brief A regular expression that describes comments with special meaning,
341   /// which should not be split into lines or otherwise changed.
342   std::string CommentPragmas;
343 
344   /// \brief Disables formatting at all.
345   bool DisableFormat;
346 
347   /// \brief A vector of macros that should be interpreted as foreach loops
348   /// instead of as function calls.
349   ///
350   /// These are expected to be macros of the form:
351   /// \code
352   /// FOREACH(<variable-declaration>, ...)
353   ///   <loop-body>
354   /// \endcode
355   ///
356   /// For example: BOOST_FOREACH.
357   std::vector<std::string> ForEachMacros;
358 
359   bool operator==(const FormatStyle &R) const {
360     return AccessModifierOffset == R.AccessModifierOffset &&
361            ConstructorInitializerIndentWidth ==
362                R.ConstructorInitializerIndentWidth &&
363            AlignEscapedNewlinesLeft == R.AlignEscapedNewlinesLeft &&
364            AlignTrailingComments == R.AlignTrailingComments &&
365            AllowAllParametersOfDeclarationOnNextLine ==
366                R.AllowAllParametersOfDeclarationOnNextLine &&
367            AllowShortFunctionsOnASingleLine ==
368                R.AllowShortFunctionsOnASingleLine &&
369            AllowShortBlocksOnASingleLine == R.AllowShortBlocksOnASingleLine &&
370            AllowShortIfStatementsOnASingleLine ==
371                R.AllowShortIfStatementsOnASingleLine &&
372            AllowShortLoopsOnASingleLine == R.AllowShortLoopsOnASingleLine &&
373            AlwaysBreakTemplateDeclarations ==
374                R.AlwaysBreakTemplateDeclarations &&
375            AlwaysBreakBeforeMultilineStrings ==
376                R.AlwaysBreakBeforeMultilineStrings &&
377            BinPackParameters == R.BinPackParameters &&
378            BreakBeforeBinaryOperators == R.BreakBeforeBinaryOperators &&
379            BreakBeforeTernaryOperators == R.BreakBeforeTernaryOperators &&
380            BreakBeforeBraces == R.BreakBeforeBraces &&
381            BreakConstructorInitializersBeforeComma ==
382                R.BreakConstructorInitializersBeforeComma &&
383            ColumnLimit == R.ColumnLimit &&
384            ConstructorInitializerAllOnOneLineOrOnePerLine ==
385                R.ConstructorInitializerAllOnOneLineOrOnePerLine &&
386            DerivePointerAlignment == R.DerivePointerAlignment &&
387            ExperimentalAutoDetectBinPacking ==
388                R.ExperimentalAutoDetectBinPacking &&
389            IndentCaseLabels == R.IndentCaseLabels &&
390            IndentWrappedFunctionNames == R.IndentWrappedFunctionNames &&
391            IndentWidth == R.IndentWidth && Language == R.Language &&
392            MaxEmptyLinesToKeep == R.MaxEmptyLinesToKeep &&
393            KeepEmptyLinesAtTheStartOfBlocks ==
394                R.KeepEmptyLinesAtTheStartOfBlocks &&
395            NamespaceIndentation == R.NamespaceIndentation &&
396            ObjCSpaceAfterProperty == R.ObjCSpaceAfterProperty &&
397            ObjCSpaceBeforeProtocolList == R.ObjCSpaceBeforeProtocolList &&
398            PenaltyBreakComment == R.PenaltyBreakComment &&
399            PenaltyBreakFirstLessLess == R.PenaltyBreakFirstLessLess &&
400            PenaltyBreakString == R.PenaltyBreakString &&
401            PenaltyExcessCharacter == R.PenaltyExcessCharacter &&
402            PenaltyReturnTypeOnItsOwnLine == R.PenaltyReturnTypeOnItsOwnLine &&
403            PointerAlignment == R.PointerAlignment &&
404            SpacesBeforeTrailingComments == R.SpacesBeforeTrailingComments &&
405            Cpp11BracedListStyle == R.Cpp11BracedListStyle &&
406            Standard == R.Standard && TabWidth == R.TabWidth &&
407            UseTab == R.UseTab && SpacesInParentheses == R.SpacesInParentheses &&
408            SpacesInAngles == R.SpacesInAngles &&
409            SpaceInEmptyParentheses == R.SpaceInEmptyParentheses &&
410            SpacesInContainerLiterals == R.SpacesInContainerLiterals &&
411            SpacesInCStyleCastParentheses == R.SpacesInCStyleCastParentheses &&
412            SpaceBeforeParens == R.SpaceBeforeParens &&
413            SpaceBeforeAssignmentOperators == R.SpaceBeforeAssignmentOperators &&
414            ContinuationIndentWidth == R.ContinuationIndentWidth &&
415            CommentPragmas == R.CommentPragmas &&
416            ForEachMacros == R.ForEachMacros;
417   }
418 };
419 
420 /// \brief Returns a format style complying with the LLVM coding standards:
421 /// http://llvm.org/docs/CodingStandards.html.
422 FormatStyle getLLVMStyle();
423 
424 /// \brief Returns a format style complying with one of Google's style guides:
425 /// http://google-styleguide.googlecode.com/svn/trunk/cppguide.xml.
426 /// http://google-styleguide.googlecode.com/svn/trunk/javascriptguide.xml.
427 /// https://developers.google.com/protocol-buffers/docs/style.
428 FormatStyle getGoogleStyle(FormatStyle::LanguageKind Language);
429 
430 /// \brief Returns a format style complying with Chromium's style guide:
431 /// http://www.chromium.org/developers/coding-style.
432 FormatStyle getChromiumStyle(FormatStyle::LanguageKind Language);
433 
434 /// \brief Returns a format style complying with Mozilla's style guide:
435 /// https://developer.mozilla.org/en-US/docs/Developer_Guide/Coding_Style.
436 FormatStyle getMozillaStyle();
437 
438 /// \brief Returns a format style complying with Webkit's style guide:
439 /// http://www.webkit.org/coding/coding-style.html
440 FormatStyle getWebKitStyle();
441 
442 /// \brief Returns a format style complying with GNU Coding Standards:
443 /// http://www.gnu.org/prep/standards/standards.html
444 FormatStyle getGNUStyle();
445 
446 /// \brief Returns style indicating formatting should be not applied at all.
447 FormatStyle getNoStyle();
448 
449 /// \brief Gets a predefined style for the specified language by name.
450 ///
451 /// Currently supported names: LLVM, Google, Chromium, Mozilla. Names are
452 /// compared case-insensitively.
453 ///
454 /// Returns \c true if the Style has been set.
455 bool getPredefinedStyle(StringRef Name, FormatStyle::LanguageKind Language,
456                         FormatStyle *Style);
457 
458 /// \brief Parse configuration from YAML-formatted text.
459 ///
460 /// Style->Language is used to get the base style, if the \c BasedOnStyle
461 /// option is present.
462 ///
463 /// When \c BasedOnStyle is not present, options not present in the YAML
464 /// document, are retained in \p Style.
465 std::error_code parseConfiguration(StringRef Text, FormatStyle *Style);
466 
467 /// \brief Gets configuration in a YAML string.
468 std::string configurationAsText(const FormatStyle &Style);
469 
470 /// \brief Reformats the given \p Ranges in the token stream coming out of
471 /// \c Lex.
472 ///
473 /// Each range is extended on either end to its next bigger logic unit, i.e.
474 /// everything that might influence its formatting or might be influenced by its
475 /// formatting.
476 ///
477 /// Returns the \c Replacements necessary to make all \p Ranges comply with
478 /// \p Style.
479 tooling::Replacements reformat(const FormatStyle &Style, Lexer &Lex,
480                                SourceManager &SourceMgr,
481                                std::vector<CharSourceRange> Ranges);
482 
483 /// \brief Reformats the given \p Ranges in \p Code.
484 ///
485 /// Otherwise identical to the reformat() function consuming a \c Lexer.
486 tooling::Replacements reformat(const FormatStyle &Style, StringRef Code,
487                                std::vector<tooling::Range> Ranges,
488                                StringRef FileName = "<stdin>");
489 
490 /// \brief Returns the \c LangOpts that the formatter expects you to set.
491 ///
492 /// \param Standard determines lexing mode: LC_Cpp11 and LS_Auto turn on C++11
493 /// lexing mode, LS_Cpp03 - C++03 mode.
494 LangOptions getFormattingLangOpts(
495     FormatStyle::LanguageStandard Standard = FormatStyle::LS_Cpp11);
496 
497 /// \brief Description to be used for help text for a llvm::cl option for
498 /// specifying format style. The description is closely related to the operation
499 /// of getStyle().
500 extern const char *StyleOptionHelpDescription;
501 
502 /// \brief Construct a FormatStyle based on \c StyleName.
503 ///
504 /// \c StyleName can take several forms:
505 /// \li "{<key>: <value>, ...}" - Set specic style parameters.
506 /// \li "<style name>" - One of the style names supported by
507 /// getPredefinedStyle().
508 /// \li "file" - Load style configuration from a file called '.clang-format'
509 /// located in one of the parent directories of \c FileName or the current
510 /// directory if \c FileName is empty.
511 ///
512 /// \param[in] StyleName Style name to interpret according to the description
513 /// above.
514 /// \param[in] FileName Path to start search for .clang-format if \c StyleName
515 /// == "file".
516 /// \param[in] FallbackStyle The name of a predefined style used to fallback to
517 /// in case the style can't be determined from \p StyleName.
518 ///
519 /// \returns FormatStyle as specified by \c StyleName. If no style could be
520 /// determined, the default is LLVM Style (see getLLVMStyle()).
521 FormatStyle getStyle(StringRef StyleName, StringRef FileName,
522                      StringRef FallbackStyle);
523 
524 } // end namespace format
525 } // end namespace clang
526 
527 namespace std {
528 template <>
529 struct is_error_code_enum<clang::format::ParseError> : std::true_type {};
530 }
531 
532 #endif // LLVM_CLANG_FORMAT_FORMAT_H
533