1 // Copyright 2012 The Chromium Authors 2 // Use of this source code is governed by a BSD-style license that can be 3 // found in the LICENSE file. 4 5 // This class works with command lines: building and parsing. 6 // Arguments with prefixes ('--', '-', and on Windows, '/') are switches. 7 // Switches will precede all other arguments without switch prefixes. 8 // Switches can optionally have values, delimited by '=', e.g., "-switch=value". 9 // If a switch is specified multiple times, only the last value is used. 10 // An argument of "--" will terminate switch parsing during initialization, 11 // interpreting subsequent tokens as non-switch arguments, regardless of prefix. 12 13 // There is a singleton read-only CommandLine that represents the command line 14 // that the current process was started with. It must be initialized in main(). 15 16 #ifndef BASE_COMMAND_LINE_H_ 17 #define BASE_COMMAND_LINE_H_ 18 19 #include <stddef.h> 20 #include <functional> 21 #include <map> 22 #include <memory> 23 #include <string> 24 #include <vector> 25 26 #include "base/base_export.h" 27 #include "base/debug/debugging_buildflags.h" 28 #include "base/strings/string_piece.h" 29 #include "build/build_config.h" 30 31 #if BUILDFLAG(ENABLE_COMMANDLINE_SEQUENCE_CHECKS) 32 #include "base/sequence_checker.h" 33 #endif // BUILDFLAG(ENABLE_COMMANDLINE_SEQUENCE_CHECKS) 34 35 namespace base { 36 37 class DuplicateSwitchHandler; 38 class FilePath; 39 40 class BASE_EXPORT CommandLine { 41 public: 42 #if BUILDFLAG(IS_WIN) 43 // The native command line string type. 44 using StringType = std::wstring; 45 #elif BUILDFLAG(IS_POSIX) || BUILDFLAG(IS_FUCHSIA) 46 using StringType = std::string; 47 #endif 48 49 using CharType = StringType::value_type; 50 using StringPieceType = base::BasicStringPiece<CharType>; 51 using StringVector = std::vector<StringType>; 52 using SwitchMap = std::map<std::string, StringType, std::less<>>; 53 54 // A constructor for CommandLines that only carry switches and arguments. 55 enum NoProgram { NO_PROGRAM }; 56 explicit CommandLine(NoProgram no_program); 57 58 // Construct a new command line with |program| as argv[0]. 59 explicit CommandLine(const FilePath& program); 60 61 // Construct a new command line from an argument list. 62 CommandLine(int argc, const CharType* const* argv); 63 explicit CommandLine(const StringVector& argv); 64 65 // Allow the copy constructor. A common pattern is to copy of the current 66 // process's command line and then add some flags to it. For example: 67 // CommandLine cl(*CommandLine::ForCurrentProcess()); 68 // cl.AppendSwitch(...); 69 CommandLine(const CommandLine& other); 70 CommandLine& operator=(const CommandLine& other); 71 72 ~CommandLine(); 73 74 #if BUILDFLAG(IS_WIN) 75 // By default this class will treat command-line arguments beginning with 76 // slashes as switches on Windows, but not other platforms. 77 // 78 // If this behavior is inappropriate for your application, you can call this 79 // function BEFORE initializing the current process' global command line 80 // object and the behavior will be the same as Posix systems (only hyphens 81 // begin switches, everything else will be an arg). 82 static void set_slash_is_not_a_switch(); 83 84 // Normally when the CommandLine singleton is initialized it gets the command 85 // line via the GetCommandLineW API and then uses the shell32 API 86 // CommandLineToArgvW to parse the command line and convert it back to 87 // argc and argv. Tests who don't want this dependency on shell32 and need 88 // to honor the arguments passed in should use this function. 89 static void InitUsingArgvForTesting(int argc, const char* const* argv); 90 #endif 91 92 // Initialize the current process CommandLine singleton. On Windows, ignores 93 // its arguments (we instead parse GetCommandLineW() directly) because we 94 // don't trust the CRT's parsing of the command line, but it still must be 95 // called to set up the command line. Returns false if initialization has 96 // already occurred, and true otherwise. Only the caller receiving a 'true' 97 // return value should take responsibility for calling Reset. 98 static bool Init(int argc, const char* const* argv); 99 100 // Destroys the current process CommandLine singleton. This is necessary if 101 // you want to reset the base library to its initial state (for example, in an 102 // outer library that needs to be able to terminate, and be re-initialized). 103 // If Init is called only once, as in main(), Reset() is not necessary. 104 // Do not call this in tests. Use base::test::ScopedCommandLine instead. 105 static void Reset(); 106 107 // Get the singleton CommandLine representing the current process's 108 // command line. Note: returned value is mutable, but not thread safe; 109 // only mutate if you know what you're doing! 110 static CommandLine* ForCurrentProcess(); 111 112 // Returns true if the CommandLine has been initialized for the given process. 113 static bool InitializedForCurrentProcess(); 114 115 #if BUILDFLAG(IS_WIN) 116 static CommandLine FromString(StringPieceType command_line); 117 #endif 118 119 // Initialize from an argv vector. 120 void InitFromArgv(int argc, const CharType* const* argv); 121 void InitFromArgv(const StringVector& argv); 122 123 // Constructs and returns the represented command line string. 124 // CAUTION! This should be avoided on POSIX because quoting behavior is 125 // unclear. 126 // CAUTION! If writing a command line to the Windows registry, use 127 // GetCommandLineStringForShell() instead. 128 StringType GetCommandLineString() const; 129 130 #if BUILDFLAG(IS_WIN) 131 // Quotes and escapes `arg` if necessary so that it will be interpreted as a 132 // single command-line parameter according to the following rules in line with 133 // `::CommandLineToArgvW` and C++ `main`: 134 // * Returns `arg` unchanged if `arg` does not include any characters that may 135 // need encoding, which is spaces, tabs, backslashes, and double-quotes. 136 // * Otherwise, double-quotes `arg` and in addition: 137 // * Escapes any double-quotes in `arg` with backslashes. 138 // * Escapes backslashes in `arg` if: 139 // * `arg` ends with backslashes , or 140 // * the backslashes end in a pre-existing double quote. 141 // 142 // https://learn.microsoft.com/en-us/search/?terms=CommandLineToArgvW and 143 // http://msdn.microsoft.com/en-us/library/17w5ykft.aspx#parsing-c-command-line-arguments. 144 static std::wstring QuoteForCommandLineToArgvW(const std::wstring& arg); 145 146 // Returns the command-line string in the proper format for the Windows shell, 147 // ending with the argument placeholder "--single-argument %1". The single- 148 // argument switch prevents unexpected parsing of arguments from other 149 // software that cannot be trusted to escape double quotes when substituting 150 // into a placeholder (e.g., "%1" insert sequences populated by the Windows 151 // shell). 152 // NOTE: this must be used to generate the command-line string for the shell 153 // even if this command line was parsed from a string with the proper syntax, 154 // because the --single-argument switch is not preserved during parsing. 155 StringType GetCommandLineStringForShell() const; 156 157 // Returns the represented command-line string. Allows the use of unsafe 158 // Windows insert sequences like "%1". Only use this method if 159 // GetCommandLineStringForShell() is not adequate AND the processor inserting 160 // the arguments is known to do so securely (i.e., is not the Windows shell). 161 // If in doubt, do not use. 162 StringType GetCommandLineStringWithUnsafeInsertSequences() const; 163 #endif 164 165 // Constructs and returns the represented arguments string. 166 // CAUTION! This should be avoided on POSIX because quoting behavior is 167 // unclear. 168 StringType GetArgumentsString() const; 169 170 // Returns the original command line string as a vector of strings. argv()171 const StringVector& argv() const { return argv_; } 172 173 // Get and Set the program part of the command line string (the first item). 174 FilePath GetProgram() const; 175 void SetProgram(const FilePath& program); 176 177 // Returns true if this command line contains the given switch. 178 // Switch names must be lowercase. 179 // The second override provides an optimized version to avoid inlining codegen 180 // at every callsite to find the length of the constant and construct a 181 // StringPiece. 182 bool HasSwitch(StringPiece switch_string) const; 183 bool HasSwitch(const char switch_constant[]) const; 184 185 // Returns the value associated with the given switch. If the switch has no 186 // value or isn't present, this method returns the empty string. 187 // Switch names must be lowercase. 188 std::string GetSwitchValueASCII(StringPiece switch_string) const; 189 FilePath GetSwitchValuePath(StringPiece switch_string) const; 190 StringType GetSwitchValueNative(StringPiece switch_string) const; 191 192 // Get a copy of all switches, along with their values. GetSwitches()193 const SwitchMap& GetSwitches() const { return switches_; } 194 195 // Append a switch [with optional value] to the command line. 196 // Note: Switches will precede arguments regardless of appending order. 197 void AppendSwitch(StringPiece switch_string); 198 void AppendSwitchPath(StringPiece switch_string, const FilePath& path); 199 void AppendSwitchNative(StringPiece switch_string, StringPieceType value); 200 void AppendSwitchASCII(StringPiece switch_string, StringPiece value); 201 202 // Removes the switch that matches |switch_key_without_prefix|, regardless of 203 // prefix and value. If no such switch is present, this has no effect. 204 void RemoveSwitch(const base::StringPiece switch_key_without_prefix); 205 206 // Copy a set of switches (and any values) from another command line. 207 // Commonly used when launching a subprocess. 208 void CopySwitchesFrom(const CommandLine& source, 209 const char* const switches[], 210 size_t count); 211 212 // Get the remaining arguments to the command. 213 StringVector GetArgs() const; 214 215 // Append an argument to the command line. Note that the argument is quoted 216 // properly such that it is interpreted as one argument to the target command. 217 // AppendArg is primarily for ASCII; non-ASCII input is interpreted as UTF-8. 218 // Note: Switches will precede arguments regardless of appending order. 219 void AppendArg(StringPiece value); 220 void AppendArgPath(const FilePath& value); 221 void AppendArgNative(StringPieceType value); 222 223 // Append the switches and arguments from another command line to this one. 224 // If |include_program| is true, include |other|'s program as well. 225 void AppendArguments(const CommandLine& other, bool include_program); 226 227 // Insert a command before the current command. 228 // Common for debuggers, like "gdb --args". 229 void PrependWrapper(StringPieceType wrapper); 230 231 #if BUILDFLAG(IS_WIN) 232 // Initialize by parsing the given command line string. 233 // The program name is assumed to be the first item in the string. 234 void ParseFromString(StringPieceType command_line); 235 236 // Returns true if the command line had the --single-argument switch, and 237 // thus likely came from a Windows shell registration. This is only set if the 238 // command line is parsed, and is not changed after it is parsed. HasSingleArgumentSwitch()239 bool HasSingleArgumentSwitch() const { return has_single_argument_switch_; } 240 #endif 241 242 // Detaches this object from the current sequence in preparation for a move to 243 // a different sequence. 244 void DetachFromCurrentSequence(); 245 246 // Sets a delegate that's called when we encounter a duplicate switch 247 static void SetDuplicateSwitchHandler( 248 std::unique_ptr<DuplicateSwitchHandler>); 249 250 private: 251 #if BUILDFLAG(ENABLE_COMMANDLINE_SEQUENCE_CHECKS) 252 // A helper class that encapsulates a SEQUENCE_CHECKER but allows copy. 253 // Copying this class will detach the sequence checker from the owning object. 254 class InstanceBoundSequenceChecker { 255 public: 256 InstanceBoundSequenceChecker() = default; 257 InstanceBoundSequenceChecker(const InstanceBoundSequenceChecker & other)258 InstanceBoundSequenceChecker(const InstanceBoundSequenceChecker& other) {} 259 260 InstanceBoundSequenceChecker& operator=( 261 const InstanceBoundSequenceChecker& other) { 262 return *this; 263 } 264 265 // Disallow move. 266 InstanceBoundSequenceChecker(InstanceBoundSequenceChecker&&) = delete; 267 InstanceBoundSequenceChecker& operator=(InstanceBoundSequenceChecker&&) = 268 delete; 269 Detach()270 void Detach() { DETACH_FROM_SEQUENCE(sequence_checker_); } Check()271 void Check() { DCHECK_CALLED_ON_VALID_SEQUENCE(sequence_checker_); } 272 273 private: 274 SEQUENCE_CHECKER(sequence_checker_); 275 }; 276 #endif // BUILDFLAG(ENABLE_COMMANDLINE_SEQUENCE_CHECKS) 277 278 // Disallow default constructor; a program name must be explicitly specified. 279 CommandLine() = delete; 280 281 // Append switches and arguments, keeping switches before arguments. 282 void AppendSwitchesAndArguments(const StringVector& argv); 283 284 // Internal version of GetArgumentsString to support allowing unsafe insert 285 // sequences in rare cases (see 286 // GetCommandLineStringWithUnsafeInsertSequences). 287 StringType GetArgumentsStringInternal( 288 bool allow_unsafe_insert_sequences) const; 289 290 #if BUILDFLAG(IS_WIN) 291 // Initializes by parsing |raw_command_line_string_|, treating everything 292 // after |single_arg_switch_string| + <a single character> as the command 293 // line's single argument, and dropping any arguments previously parsed. The 294 // command line must contain |single_arg_switch_string|, and the argument, if 295 // present, must be separated from |single_arg_switch_string| by one 296 // character. 297 // NOTE: the single-argument switch is not preserved after parsing; 298 // GetCommandLineStringForShell() must be used to reproduce the original 299 // command-line string with single-argument switch. 300 void ParseAsSingleArgument(const StringType& single_arg_switch_string); 301 302 // The string returned by GetCommandLineW(), to be parsed via 303 // ParseFromString(). Empty if this command line was not parsed from a string, 304 // or if ParseFromString() has finished executing. 305 StringPieceType raw_command_line_string_; 306 307 // Set to true if the command line had --single-argument when initially 308 // parsed. It does not change if the command line mutates after initial 309 // parsing. 310 bool has_single_argument_switch_ = false; 311 #endif 312 313 // The singleton CommandLine representing the current process's command line. 314 static CommandLine* current_process_commandline_; 315 316 // The argv array: { program, [(--|-|/)switch[=value]]*, [--], [argument]* } 317 StringVector argv_; 318 319 // Parsed-out switch keys and values. 320 SwitchMap switches_; 321 322 // The index after the program and switches, any arguments start here. 323 ptrdiff_t begin_args_; 324 325 #if BUILDFLAG(ENABLE_COMMANDLINE_SEQUENCE_CHECKS) 326 InstanceBoundSequenceChecker sequence_checker_; 327 #endif 328 }; 329 330 class BASE_EXPORT DuplicateSwitchHandler { 331 public: 332 // out_value contains the existing value of the switch 333 virtual void ResolveDuplicate(base::StringPiece key, 334 CommandLine::StringPieceType new_value, 335 CommandLine::StringType& out_value) = 0; 336 virtual ~DuplicateSwitchHandler() = default; 337 }; 338 339 } // namespace base 340 341 #endif // BASE_COMMAND_LINE_H_ 342