• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 // Copyright 2012 The Chromium Authors
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4 
5 // This class works with command lines: building and parsing.
6 // Arguments with prefixes ('--', '-', and on Windows, '/') are switches.
7 // Switches will precede all other arguments without switch prefixes.
8 // Switches can optionally have values, delimited by '=', e.g., "-switch=value".
9 // If a switch is specified multiple times, only the last value is used.
10 // An argument of "--" will terminate switch parsing during initialization,
11 // interpreting subsequent tokens as non-switch arguments, regardless of prefix.
12 
13 // There is a singleton read-only CommandLine that represents the command line
14 // that the current process was started with.  It must be initialized in main().
15 
16 #ifndef BASE_COMMAND_LINE_H_
17 #define BASE_COMMAND_LINE_H_
18 
19 #include <stddef.h>
20 #include <functional>
21 #include <map>
22 #include <memory>
23 #include <string>
24 #include <vector>
25 
26 #include "base/base_export.h"
27 #include "base/debug/debugging_buildflags.h"
28 #include "base/strings/string_piece.h"
29 #include "build/build_config.h"
30 
31 #if BUILDFLAG(ENABLE_COMMANDLINE_SEQUENCE_CHECKS)
32 #include "base/sequence_checker.h"
33 #endif  // BUILDFLAG(ENABLE_COMMANDLINE_SEQUENCE_CHECKS)
34 
35 namespace base {
36 
37 class DuplicateSwitchHandler;
38 class FilePath;
39 
// Represents a command line: a program (argv[0]) followed by switches and then
// non-switch arguments. Declares per-instance builders/accessors as well as
// static accessors for a per-process singleton instance.
40 class BASE_EXPORT CommandLine {
41  public:
42 #if BUILDFLAG(IS_WIN)
43   // The native command line string type.
44   using StringType = std::wstring;
45 #elif BUILDFLAG(IS_POSIX) || BUILDFLAG(IS_FUCHSIA)
46   using StringType = std::string;
47 #endif
48 
  // Character, view and container types derived from the native StringType.
49   using CharType = StringType::value_type;
50   using StringPieceType = base::BasicStringPiece<CharType>;
51   using StringVector = std::vector<StringType>;
  // Maps a switch name to its native value. std::less<> is a transparent
  // comparator, so lookups may use a comparable key type other than
  // std::string without building a temporary std::string.
52   using SwitchMap = std::map<std::string, StringType, std::less<>>;
53 
54   // A constructor for CommandLines that only carry switches and arguments.
55   enum NoProgram { NO_PROGRAM };
56   explicit CommandLine(NoProgram no_program);
57 
58   // Construct a new command line with |program| as argv[0].
59   explicit CommandLine(const FilePath& program);
60 
61   // Construct a new command line from an argument list.
62   CommandLine(int argc, const CharType* const* argv);
63   explicit CommandLine(const StringVector& argv);
64 
65   // Allow the copy constructor. A common pattern is to make a copy of the
66   // current process's command line and then add some flags to it. For example:
67   //   CommandLine cl(*CommandLine::ForCurrentProcess());
68   //   cl.AppendSwitch(...);
69   CommandLine(const CommandLine& other);
70   CommandLine& operator=(const CommandLine& other);
71 
72   ~CommandLine();
73 
74 #if BUILDFLAG(IS_WIN)
75   // By default this class will treat command-line arguments beginning with
76   // slashes as switches on Windows, but not other platforms.
77   //
78   // If this behavior is inappropriate for your application, you can call this
79   // function BEFORE initializing the current process' global command line
80   // object and the behavior will be the same as Posix systems (only hyphens
81   // begin switches, everything else will be an arg).
82   static void set_slash_is_not_a_switch();
83 
84   // Normally when the CommandLine singleton is initialized it gets the command
85   // line via the GetCommandLineW API and then uses the shell32 API
86   // CommandLineToArgvW to parse the command line and convert it back to
87   // argc and argv. Tests that don't want this dependency on shell32 and need
88   // to honor the arguments passed in should use this function.
89   static void InitUsingArgvForTesting(int argc, const char* const* argv);
90 #endif
91 
92   // Initialize the current process CommandLine singleton. On Windows, ignores
93   // its arguments (we instead parse GetCommandLineW() directly) because we
94   // don't trust the CRT's parsing of the command line, but it still must be
95   // called to set up the command line. Returns false if initialization has
96   // already occurred, and true otherwise. Only the caller receiving a 'true'
97   // return value should take responsibility for calling Reset.
98   static bool Init(int argc, const char* const* argv);
99 
100   // Destroys the current process CommandLine singleton. This is necessary if
101   // you want to reset the base library to its initial state (for example, in an
102   // outer library that needs to be able to terminate, and be re-initialized).
103   // If Init is called only once, as in main(), Reset() is not necessary.
104   // Do not call this in tests. Use base::test::ScopedCommandLine instead.
105   static void Reset();
106 
107   // Get the singleton CommandLine representing the current process's
108   // command line. Note: returned value is mutable, but not thread safe;
109   // only mutate if you know what you're doing!
110   static CommandLine* ForCurrentProcess();
111 
112   // Returns true if the CommandLine has been initialized for the current
  // process.
113   static bool InitializedForCurrentProcess();
114 
115 #if BUILDFLAG(IS_WIN)
  // Returns a CommandLine built from the string |command_line|.
  // NOTE(review): presumably parses it the same way ParseFromString() does --
  // confirm against the implementation file.
116   static CommandLine FromString(StringPieceType command_line);
117 #endif
118 
119   // Initialize from an argv vector.
120   void InitFromArgv(int argc, const CharType* const* argv);
121   void InitFromArgv(const StringVector& argv);
122 
123   // Constructs and returns the represented command line string.
124   // CAUTION! This should be avoided on POSIX because quoting behavior is
125   // unclear.
126   // CAUTION! If writing a command line to the Windows registry, use
127   // GetCommandLineStringForShell() instead.
128   StringType GetCommandLineString() const;
129 
130 #if BUILDFLAG(IS_WIN)
131   // Quotes and escapes `arg` if necessary so that it will be interpreted as a
132   // single command-line parameter according to the following rules in line with
133   // `::CommandLineToArgvW` and C++ `main`:
134   // * Returns `arg` unchanged if `arg` does not include any characters that may
135   // need encoding, which is spaces, tabs, backslashes, and double-quotes.
136   // * Otherwise, double-quotes `arg` and in addition:
137   //   * Escapes any double-quotes in `arg` with backslashes.
138   //   * Escapes backslashes in `arg` if:
139   //     * `arg` ends with backslashes, or
140   //     * the backslashes end in a pre-existing double quote.
141   //
142   // https://learn.microsoft.com/en-us/search/?terms=CommandLineToArgvW and
143   // http://msdn.microsoft.com/en-us/library/17w5ykft.aspx#parsing-c-command-line-arguments.
144   static std::wstring QuoteForCommandLineToArgvW(const std::wstring& arg);
145 
146   // Returns the command-line string in the proper format for the Windows shell,
147   // ending with the argument placeholder "--single-argument %1". The single-
148   // argument switch prevents unexpected parsing of arguments from other
149   // software that cannot be trusted to escape double quotes when substituting
150   // into a placeholder (e.g., "%1" insert sequences populated by the Windows
151   // shell).
152   // NOTE: this must be used to generate the command-line string for the shell
153   // even if this command line was parsed from a string with the proper syntax,
154   // because the --single-argument switch is not preserved during parsing.
155   StringType GetCommandLineStringForShell() const;
156 
157   // Returns the represented command-line string. Allows the use of unsafe
158   // Windows insert sequences like "%1". Only use this method if
159   // GetCommandLineStringForShell() is not adequate AND the processor inserting
160   // the arguments is known to do so securely (i.e., is not the Windows shell).
161   // If in doubt, do not use.
162   StringType GetCommandLineStringWithUnsafeInsertSequences() const;
163 #endif
164 
165   // Constructs and returns the represented arguments string.
166   // CAUTION! This should be avoided on POSIX because quoting behavior is
167   // unclear.
168   StringType GetArgumentsString() const;
169 
170   // Returns the original command line string as a vector of strings.
argv()171   const StringVector& argv() const { return argv_; }
172 
173   // Get and Set the program part of the command line string (the first item).
174   FilePath GetProgram() const;
175   void SetProgram(const FilePath& program);
176 
177   // Returns true if this command line contains the given switch.
178   // Switch names must be lowercase.
179   // The second overload provides an optimized version to avoid inlining codegen
180   // at every callsite to find the length of the constant and construct a
181   // StringPiece.
182   bool HasSwitch(StringPiece switch_string) const;
183   bool HasSwitch(const char switch_constant[]) const;
184 
185   // Returns the value associated with the given switch. If the switch has no
186   // value or isn't present, this method returns the empty string.
187   // Switch names must be lowercase.
188   std::string GetSwitchValueASCII(StringPiece switch_string) const;
189   FilePath GetSwitchValuePath(StringPiece switch_string) const;
190   StringType GetSwitchValueNative(StringPiece switch_string) const;
191 
192   // Returns a const reference (not a copy) to the map of all switches and
  // their values.
GetSwitches()193   const SwitchMap& GetSwitches() const { return switches_; }
194 
195   // Append a switch [with optional value] to the command line.
196   // Note: Switches will precede arguments regardless of appending order.
197   void AppendSwitch(StringPiece switch_string);
198   void AppendSwitchPath(StringPiece switch_string, const FilePath& path);
199   void AppendSwitchNative(StringPiece switch_string, StringPieceType value);
200   void AppendSwitchASCII(StringPiece switch_string, StringPiece value);
201 
202   // Removes the switch that matches |switch_key_without_prefix|, regardless of
203   // prefix and value. If no such switch is present, this has no effect.
204   void RemoveSwitch(const base::StringPiece switch_key_without_prefix);
205 
206   // Copy a set of switches (and any values) from another command line.
207   // Commonly used when launching a subprocess.
208   void CopySwitchesFrom(const CommandLine& source,
209                         const char* const switches[],
210                         size_t count);
211 
212   // Get the remaining arguments to the command.
213   StringVector GetArgs() const;
214 
215   // Append an argument to the command line. Note that the argument is quoted
216   // properly such that it is interpreted as one argument to the target command.
217   // AppendArg is primarily for ASCII; non-ASCII input is interpreted as UTF-8.
218   // Note: Switches will precede arguments regardless of appending order.
219   void AppendArg(StringPiece value);
220   void AppendArgPath(const FilePath& value);
221   void AppendArgNative(StringPieceType value);
222 
223   // Append the switches and arguments from another command line to this one.
224   // If |include_program| is true, include |other|'s program as well.
225   void AppendArguments(const CommandLine& other, bool include_program);
226 
227   // Insert a command before the current command.
228   // Common for debuggers, like "gdb --args".
229   void PrependWrapper(StringPieceType wrapper);
230 
231 #if BUILDFLAG(IS_WIN)
232   // Initialize by parsing the given command line string.
233   // The program name is assumed to be the first item in the string.
234   void ParseFromString(StringPieceType command_line);
235 
236   // Returns true if the command line had the --single-argument switch, and
237   // thus likely came from a Windows shell registration. This is only set if the
238   // command line is parsed, and is not changed after it is parsed.
HasSingleArgumentSwitch()239   bool HasSingleArgumentSwitch() const { return has_single_argument_switch_; }
240 #endif
241 
242   // Detaches this object from the current sequence in preparation for a move to
243   // a different sequence.
244   void DetachFromCurrentSequence();
245 
246   // Sets a delegate that's called when we encounter a duplicate switch.
247   static void SetDuplicateSwitchHandler(
248       std::unique_ptr<DuplicateSwitchHandler>);
249 
250  private:
251 #if BUILDFLAG(ENABLE_COMMANDLINE_SEQUENCE_CHECKS)
252   // A helper class that encapsulates a SEQUENCE_CHECKER but allows copy.
253   // Copying this class will detach the sequence checker from the owning object.
254   class InstanceBoundSequenceChecker {
255    public:
256     InstanceBoundSequenceChecker() = default;
257 
    // Deliberately copies nothing from |other|: the body is empty, so the new
    // object's |sequence_checker_| is default-initialized rather than copied.
InstanceBoundSequenceChecker(const InstanceBoundSequenceChecker & other)258     InstanceBoundSequenceChecker(const InstanceBoundSequenceChecker& other) {}
259 
    // Assignment is likewise a no-op; this object's checker is left untouched.
260     InstanceBoundSequenceChecker& operator=(
261         const InstanceBoundSequenceChecker& other) {
262       return *this;
263     }
264 
265     // Disallow move.
266     InstanceBoundSequenceChecker(InstanceBoundSequenceChecker&&) = delete;
267     InstanceBoundSequenceChecker& operator=(InstanceBoundSequenceChecker&&) =
268         delete;
269 
    // Thin wrappers over the sequence-checker macros for |sequence_checker_|.
Detach()270     void Detach() { DETACH_FROM_SEQUENCE(sequence_checker_); }
Check()271     void Check() { DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_); }
272 
273    private:
274     SEQUENCE_CHECKER(sequence_checker_);
275   };
276 #endif  // BUILDFLAG(ENABLE_COMMANDLINE_SEQUENCE_CHECKS)
277 
278   // Disallow default constructor; a program name must be explicitly specified.
279   CommandLine() = delete;
280 
281   // Append switches and arguments, keeping switches before arguments.
282   void AppendSwitchesAndArguments(const StringVector& argv);
283 
284   // Internal version of GetArgumentsString to support allowing unsafe insert
285   // sequences in rare cases (see
286   // GetCommandLineStringWithUnsafeInsertSequences).
287   StringType GetArgumentsStringInternal(
288       bool allow_unsafe_insert_sequences) const;
289 
290 #if BUILDFLAG(IS_WIN)
291   // Initializes by parsing |raw_command_line_string_|, treating everything
292   // after |single_arg_switch_string| + <a single character> as the command
293   // line's single argument, and dropping any arguments previously parsed. The
294   // command line must contain |single_arg_switch_string|, and the argument, if
295   // present, must be separated from |single_arg_switch_string| by one
296   // character.
297   // NOTE: the single-argument switch is not preserved after parsing;
298   // GetCommandLineStringForShell() must be used to reproduce the original
299   // command-line string with single-argument switch.
300   void ParseAsSingleArgument(const StringType& single_arg_switch_string);
301 
302   // The string returned by GetCommandLineW(), to be parsed via
303   // ParseFromString(). Empty if this command line was not parsed from a string,
304   // or if ParseFromString() has finished executing.
  // Note: StringPieceType is a non-owning view, so this member does not own
  // the characters it refers to.
305   StringPieceType raw_command_line_string_;
306 
307   // Set to true if the command line had --single-argument when initially
308   // parsed. It does not change if the command line mutates after initial
309   // parsing.
310   bool has_single_argument_switch_ = false;
311 #endif
312 
313   // The singleton CommandLine representing the current process's command line.
314   static CommandLine* current_process_commandline_;
315 
316   // The argv array: { program, [(--|-|/)switch[=value]]*, [--], [argument]* }
317   StringVector argv_;
318 
319   // Parsed-out switch keys and values.
320   SwitchMap switches_;
321 
322   // The index after the program and switches, any arguments start here.
  // No in-class initializer here; NOTE(review): presumably every constructor
  // sets it -- confirm in the implementation file.
323   ptrdiff_t begin_args_;
324 
325 #if BUILDFLAG(ENABLE_COMMANDLINE_SEQUENCE_CHECKS)
326   InstanceBoundSequenceChecker sequence_checker_;
327 #endif
328 };
329 
// Abstract delegate interface for resolving a switch that appears more than
// once. An instance is installed via CommandLine::SetDuplicateSwitchHandler().
330 class BASE_EXPORT DuplicateSwitchHandler {
331  public:
  // Invoked for a duplicate of switch |key|, with |new_value| being the value
  // of the newly encountered occurrence.
332   // out_value contains the existing value of the switch
  // on entry. It is passed by non-const reference, so an implementation can
  // overwrite it. NOTE(review): presumably whatever it holds on return becomes
  // the switch's stored value -- confirm against the caller.
333   virtual void ResolveDuplicate(base::StringPiece key,
334                                 CommandLine::StringPieceType new_value,
335                                 CommandLine::StringType& out_value) = 0;
  // Virtual so implementations can be destroyed through a base-class pointer,
  // such as the std::unique_ptr<DuplicateSwitchHandler> taken by
  // CommandLine::SetDuplicateSwitchHandler().
336   virtual ~DuplicateSwitchHandler() = default;
337 };
338 
339 }  // namespace base
340 
341 #endif  // BASE_COMMAND_LINE_H_
342