1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
4
5 #include "base/command_line.h"
6
7 #include <algorithm>
8 #include <iterator>
9 #include <ostream>
10 #include <string_view>
11
12 #include "base/files/file_path.h"
13 #include "base/logging.h"
14 #include "base/stl_util.h"
15 #include "base/strings/string_split.h"
16 #include "base/strings/string_tokenizer.h"
17 #include "base/strings/string_util.h"
18 #include "base/strings/utf_string_conversions.h"
19 #include "util/build_config.h"
20
21 #if defined(OS_WIN)
22 #include <windows.h>
23
24 #include <shellapi.h>
25 #endif
26
27 namespace base {
28
29 CommandLine* CommandLine::current_process_commandline_ = nullptr;
30
31 namespace {
32
33 const CommandLine::CharType kSwitchTerminator[] = FILE_PATH_LITERAL("--");
34 const CommandLine::CharType kSwitchValueSeparator[] = FILE_PATH_LITERAL("=");
35
36 // Since we use a lazy match, make sure that longer versions (like "--") are
37 // listed before shorter versions (like "-") of similar prefixes.
38 #if defined(OS_WIN)
39 // By putting slash last, we can control whether it is treaded as a switch
40 // value by changing the value of switch_prefix_count to be one less than
41 // the array size.
42 const CommandLine::CharType* const kSwitchPrefixes[] = {u"--", u"-", u"/"};
43 #elif defined(OS_POSIX) || defined(OS_FUCHSIA)
44 // Unixes don't use slash as a switch.
45 const CommandLine::CharType* const kSwitchPrefixes[] = {"--", "-"};
46 #endif
47 size_t switch_prefix_count = std::size(kSwitchPrefixes);
48
GetSwitchPrefixLength(const CommandLine::StringType & string)49 size_t GetSwitchPrefixLength(const CommandLine::StringType& string) {
50 for (size_t i = 0; i < switch_prefix_count; ++i) {
51 CommandLine::StringType prefix(kSwitchPrefixes[i]);
52 if (string.compare(0, prefix.length(), prefix) == 0)
53 return prefix.length();
54 }
55 return 0;
56 }
57
58 // Fills in |switch_string| and |switch_value| if |string| is a switch.
59 // This will preserve the input switch prefix in the output |switch_string|.
IsSwitch(const CommandLine::StringType & string,CommandLine::StringType * switch_string,CommandLine::StringType * switch_value)60 bool IsSwitch(const CommandLine::StringType& string,
61 CommandLine::StringType* switch_string,
62 CommandLine::StringType* switch_value) {
63 switch_string->clear();
64 switch_value->clear();
65 size_t prefix_length = GetSwitchPrefixLength(string);
66 if (prefix_length == 0 || prefix_length == string.length())
67 return false;
68
69 const size_t equals_position = string.find(kSwitchValueSeparator);
70 *switch_string = string.substr(0, equals_position);
71 if (equals_position != CommandLine::StringType::npos)
72 *switch_value = string.substr(equals_position + 1);
73 return true;
74 }
75
76 // Append switches and arguments, keeping switches before arguments
77 // if handle_switches is true.
AppendSwitchesAndArguments(CommandLine * command_line,const CommandLine::StringVector & argv,bool handle_switches)78 void AppendSwitchesAndArguments(CommandLine* command_line,
79 const CommandLine::StringVector& argv,
80 bool handle_switches) {
81 bool parse_switches = handle_switches;
82 for (size_t i = 1; i < argv.size(); ++i) {
83 CommandLine::StringType arg = argv[i];
84 #if defined(OS_WIN)
85 TrimWhitespace(arg, TRIM_ALL, &arg);
86 #elif defined(OS_POSIX) || defined(OS_FUCHSIA)
87 TrimWhitespaceASCII(arg, TRIM_ALL, &arg);
88 #endif
89
90 CommandLine::StringType switch_string;
91 CommandLine::StringType switch_value;
92 parse_switches &= (arg != kSwitchTerminator);
93 if (parse_switches && IsSwitch(arg, &switch_string, &switch_value)) {
94 #if defined(OS_WIN)
95 command_line->AppendSwitchNative(UTF16ToASCII(switch_string),
96 switch_value);
97 #elif defined(OS_POSIX) || defined(OS_FUCHSIA)
98 command_line->AppendSwitchNative(switch_string, switch_value);
99 #else
100 #error Unsupported platform
101 #endif
102 } else {
103 command_line->AppendArgNative(arg);
104 }
105 }
106 }
107
108 #if defined(OS_WIN)
// Quotes |arg| as necessary so that CommandLineToArgvW parses it back as a
// single argument *on Windows*.
//
// |arg| is returned unchanged when it contains none of: space, tab, backslash,
// double quote, or (only when |quote_placeholders| is true) '%'. Otherwise the
// result is |arg| wrapped in double quotes, with embedded double quotes
// escaped and backslash runs doubled where they precede a double quote.
std::u16string QuoteForCommandLineToArgvW(const std::u16string& arg,
                                          bool quote_placeholders) {
  // We follow the quoting rules of CommandLineToArgvW.
  // http://msdn.microsoft.com/en-us/library/17w5ykft.aspx
  // Both space and tab delimit arguments there, so either one forces quoting.
  std::u16string quotable_chars(u" \t\\\"");
  // We may also be required to quote '%', which is commonly used in a command
  // line as a placeholder. (It may be substituted for a string with spaces.)
  if (quote_placeholders)
    quotable_chars.push_back(u'%');
  if (arg.find_first_of(quotable_chars) == std::u16string::npos) {
    // No quoting necessary.
    return arg;
  }

  std::u16string out;
  out.reserve(arg.size() + 2);
  out.push_back(u'"');
  for (size_t i = 0; i < arg.size(); ++i) {
    if (arg[i] == u'\\') {
      // Find the extent of this run of backslashes.
      size_t end = i + 1;
      while (end < arg.size() && arg[end] == u'\\')
        ++end;
      size_t backslash_count = end - i;

      // Backslashes are escapes only if the run is followed by a double quote.
      // Since we also will end the string with a double quote, we escape for
      // either a double quote or the end of the string.
      if (end == arg.size() || arg[end] == u'"') {
        // To quote, we need to output 2x as many backslashes.
        backslash_count *= 2;
      }
      out.append(backslash_count, u'\\');

      // Advance i to one before the end to balance ++i in the loop header.
      i = end - 1;
    } else if (arg[i] == u'"') {
      out.push_back(u'\\');
      out.push_back(u'"');
    } else {
      out.push_back(arg[i]);
    }
  }
  out.push_back(u'"');

  return out;
}
158 #endif
159
160 } // namespace
161
CommandLine(NoProgram no_program)162 CommandLine::CommandLine(NoProgram no_program)
163 : argv_(1), begin_args_(1), parse_switches_(true) {}
164
CommandLine(const FilePath & program)165 CommandLine::CommandLine(const FilePath& program)
166 : argv_(1), begin_args_(1), parse_switches_(true) {
167 SetProgram(program);
168 }
169
// Builds a command line from a C-style argument array: starts from the same
// empty state as the NO_PROGRAM constructor, then parses |argv|.
CommandLine::CommandLine(int argc, const CommandLine::CharType* const* argv)
    : CommandLine(NO_PROGRAM) {
  InitFromArgv(argc, argv);
}
174
CommandLine(const StringVector & argv)175 CommandLine::CommandLine(const StringVector& argv)
176 : argv_(1), begin_args_(1), parse_switches_(true) {
177 InitFromArgv(argv);
178 }
179
180 CommandLine::CommandLine(const CommandLine& other) = default;
181
182 CommandLine& CommandLine::operator=(const CommandLine& other) = default;
183
184 CommandLine::~CommandLine() = default;
185
186 #if defined(OS_WIN)
187
188 // static
StringTypeToUTF8(const StringType & input)189 std::string CommandLine::StringTypeToUTF8(const StringType& input) {
190 return UTF16ToUTF8(input);
191 }
192
193 // static
UTF8ToStringType(std::string_view input)194 CommandLine::StringType CommandLine::UTF8ToStringType(std::string_view input) {
195 return UTF8ToUTF16(input);
196 }
197
198 // static
set_slash_is_not_a_switch()199 void CommandLine::set_slash_is_not_a_switch() {
200 // The last switch prefix should be slash, so adjust the size to skip it.
201 DCHECK(std::u16string_view(kSwitchPrefixes[std::size(kSwitchPrefixes) - 1]) ==
202 std::u16string_view(u"/"));
203 switch_prefix_count = std::size(kSwitchPrefixes) - 1;
204 }
205
206 // static
InitUsingArgvForTesting(int argc,const char * const * argv)207 void CommandLine::InitUsingArgvForTesting(int argc, const char* const* argv) {
208 DCHECK(!current_process_commandline_);
209 current_process_commandline_ = new CommandLine(NO_PROGRAM);
210 // On Windows we need to convert the command line arguments to std::u16string.
211 base::CommandLine::StringVector argv_vector;
212 for (int i = 0; i < argc; ++i)
213 argv_vector.push_back(UTF8ToUTF16(argv[i]));
214 current_process_commandline_->InitFromArgv(argv_vector);
215 }
216
217 #else
218
219 // static
StringTypeToUTF8(const StringType & input)220 std::string CommandLine::StringTypeToUTF8(const StringType& input) {
221 return input;
222 }
223
224 // static
UTF8ToStringType(std::string_view input)225 CommandLine::StringType CommandLine::UTF8ToStringType(std::string_view input) {
226 return CommandLine::StringType(input);
227 }
228
229 #endif
230
231 // static
Init(int argc,const char * const * argv)232 bool CommandLine::Init(int argc, const char* const* argv) {
233 if (current_process_commandline_) {
234 // If this is intentional, Reset() must be called first. If we are using
235 // the shared build mode, we have to share a single object across multiple
236 // shared libraries.
237 return false;
238 }
239
240 current_process_commandline_ = new CommandLine(NO_PROGRAM);
241 #if defined(OS_WIN)
242 current_process_commandline_->ParseFromString(
243 reinterpret_cast<const char16_t*>(::GetCommandLineW()));
244 #elif defined(OS_POSIX) || defined(OS_FUCHSIA)
245 current_process_commandline_->InitFromArgv(argc, argv);
246 #else
247 #error Unsupported platform
248 #endif
249
250 return true;
251 }
252
253 // static
Reset()254 void CommandLine::Reset() {
255 DCHECK(current_process_commandline_);
256 delete current_process_commandline_;
257 current_process_commandline_ = nullptr;
258 }
259
260 // static
ForCurrentProcess()261 CommandLine* CommandLine::ForCurrentProcess() {
262 DCHECK(current_process_commandline_);
263 return current_process_commandline_;
264 }
265
266 // static
InitializedForCurrentProcess()267 bool CommandLine::InitializedForCurrentProcess() {
268 return !!current_process_commandline_;
269 }
270
271 #if defined(OS_WIN)
272 // static
FromString(const std::u16string & command_line)273 CommandLine CommandLine::FromString(const std::u16string& command_line) {
274 CommandLine cmd(NO_PROGRAM);
275 cmd.ParseFromString(command_line);
276 return cmd;
277 }
278 #endif
279
InitFromArgv(int argc,const CommandLine::CharType * const * argv)280 void CommandLine::InitFromArgv(int argc,
281 const CommandLine::CharType* const* argv) {
282 StringVector new_argv;
283 for (int i = 0; i < argc; ++i)
284 new_argv.push_back(argv[i]);
285 InitFromArgv(new_argv);
286 }
287
InitFromArgv(const StringVector & argv)288 void CommandLine::InitFromArgv(const StringVector& argv) {
289 argv_ = StringVector(1);
290 switches_.clear();
291 begin_args_ = 1;
292 SetProgram(argv.empty() ? FilePath() : FilePath(argv[0]));
293 AppendSwitchesAndArguments(this, argv, parse_switches_);
294 }
295
GetProgram() const296 FilePath CommandLine::GetProgram() const {
297 return FilePath(argv_[0]);
298 }
299
SetProgram(const FilePath & program)300 void CommandLine::SetProgram(const FilePath& program) {
301 #if defined(OS_WIN)
302 TrimWhitespace(program.value(), TRIM_ALL, &argv_[0]);
303 #elif defined(OS_POSIX) || defined(OS_FUCHSIA)
304 TrimWhitespaceASCII(program.value(), TRIM_ALL, &argv_[0]);
305 #else
306 #error Unsupported platform
307 #endif
308 }
309
HasSwitch(std::string_view switch_string) const310 bool CommandLine::HasSwitch(std::string_view switch_string) const {
311 DCHECK_EQ(ToLowerASCII(switch_string), switch_string);
312 return ContainsKey(switches_, switch_string);
313 }
314
HasSwitch(const char switch_constant[]) const315 bool CommandLine::HasSwitch(const char switch_constant[]) const {
316 return HasSwitch(std::string_view(switch_constant));
317 }
318
GetSwitchValueString(std::string_view switch_string) const319 std::string CommandLine::GetSwitchValueString(
320 std::string_view switch_string) const {
321 return StringTypeToUTF8(GetSwitchValueNative(switch_string));
322 }
323
GetSwitchValuePath(std::string_view switch_string) const324 FilePath CommandLine::GetSwitchValuePath(std::string_view switch_string) const {
325 return FilePath(GetSwitchValueNative(switch_string));
326 }
327
GetSwitchValueNative(std::string_view switch_string) const328 CommandLine::StringType CommandLine::GetSwitchValueNative(
329 std::string_view switch_string) const {
330 DCHECK_EQ(ToLowerASCII(switch_string), switch_string);
331
332 // There can be multiple matches, we want to find the last one.
333 auto iter = switches_.upper_bound(switch_string);
334 if (iter == switches_.begin())
335 return StringType();
336
337 // We want the item right before the upper bound, if it's a match.
338 --iter;
339 if (iter->first == switch_string)
340 return iter->second;
341 return StringType();
342 }
343
GetSwitchValueStrings(std::string_view switch_string) const344 std::vector<std::string> CommandLine::GetSwitchValueStrings(
345 std::string_view switch_string) const {
346 std::vector<StringType> matches = GetSwitchValuesNative(switch_string);
347
348 std::vector<std::string> result;
349 result.reserve(matches.size());
350
351 for (const StringType& cur : matches) {
352 result.push_back(StringTypeToUTF8(cur));
353 }
354 return result;
355 }
356
GetSwitchValuesNative(std::string_view switch_string) const357 std::vector<CommandLine::StringType> CommandLine::GetSwitchValuesNative(
358 std::string_view switch_string) const {
359 std::vector<StringType> result;
360
361 auto [iter, end] = switches_.equal_range(switch_string);
362 while (iter != end) {
363 result.push_back(iter->second);
364 ++iter;
365 }
366
367 return result;
368 }
369
AppendSwitch(const std::string & switch_string)370 void CommandLine::AppendSwitch(const std::string& switch_string) {
371 AppendSwitchNative(switch_string, StringType());
372 }
373
AppendSwitchPath(const std::string & switch_string,const FilePath & path)374 void CommandLine::AppendSwitchPath(const std::string& switch_string,
375 const FilePath& path) {
376 AppendSwitchNative(switch_string, path.value());
377 }
378
AppendSwitchNative(const std::string & switch_string,const CommandLine::StringType & value)379 void CommandLine::AppendSwitchNative(const std::string& switch_string,
380 const CommandLine::StringType& value) {
381 #if defined(OS_WIN)
382 const std::string switch_key = ToLowerASCII(switch_string);
383 StringType combined_switch_string(ASCIIToUTF16(switch_key));
384 #elif defined(OS_POSIX) || defined(OS_FUCHSIA)
385 const std::string& switch_key = switch_string;
386 StringType combined_switch_string(switch_key);
387 #endif
388
389 size_t prefix_length = GetSwitchPrefixLength(combined_switch_string);
390 switches_.insert(make_pair(switch_key.substr(prefix_length), value));
391
392 // Preserve existing switch prefixes in |argv_|; only append one if necessary.
393 if (prefix_length == 0)
394 combined_switch_string = kSwitchPrefixes[0] + combined_switch_string;
395 if (!value.empty())
396 combined_switch_string += kSwitchValueSeparator + value;
397 // Append the switch and update the switches/arguments divider |begin_args_|.
398 argv_.insert(argv_.begin() + begin_args_++, combined_switch_string);
399 }
400
AppendSwitch(const std::string & switch_string,const std::string & value_string)401 void CommandLine::AppendSwitch(const std::string& switch_string,
402 const std::string& value_string) {
403 AppendSwitchNative(switch_string, UTF8ToStringType(value_string));
404 }
405
CopySwitchesFrom(const CommandLine & source,const char * const switches[],size_t count)406 void CommandLine::CopySwitchesFrom(const CommandLine& source,
407 const char* const switches[],
408 size_t count) {
409 for (size_t i = 0; i < count; ++i) {
410 if (source.HasSwitch(switches[i]))
411 AppendSwitchNative(switches[i], source.GetSwitchValueNative(switches[i]));
412 }
413 }
414
GetArgs() const415 CommandLine::StringVector CommandLine::GetArgs() const {
416 // Gather all arguments after the last switch (may include kSwitchTerminator).
417 StringVector args(argv_.begin() + begin_args_, argv_.end());
418 // Erase only the first kSwitchTerminator (maybe "--" is a legitimate page?)
419 StringVector::iterator switch_terminator =
420 std::find(args.begin(), args.end(), kSwitchTerminator);
421 if (switch_terminator != args.end())
422 args.erase(switch_terminator);
423 return args;
424 }
425
AppendArg(const std::string & value)426 void CommandLine::AppendArg(const std::string& value) {
427 #if defined(OS_WIN)
428 DCHECK(IsStringUTF8(value));
429 AppendArgNative(UTF8ToUTF16(value));
430 #elif defined(OS_POSIX) || defined(OS_FUCHSIA)
431 AppendArgNative(value);
432 #else
433 #error Unsupported platform
434 #endif
435 }
436
AppendArgPath(const FilePath & path)437 void CommandLine::AppendArgPath(const FilePath& path) {
438 AppendArgNative(path.value());
439 }
440
AppendArgNative(const CommandLine::StringType & value)441 void CommandLine::AppendArgNative(const CommandLine::StringType& value) {
442 argv_.push_back(value);
443 }
444
AppendArguments(const CommandLine & other,bool include_program)445 void CommandLine::AppendArguments(const CommandLine& other,
446 bool include_program) {
447 if (include_program)
448 SetProgram(other.GetProgram());
449 AppendSwitchesAndArguments(this, other.argv(), parse_switches_);
450 }
451
PrependWrapper(const CommandLine::StringType & wrapper)452 void CommandLine::PrependWrapper(const CommandLine::StringType& wrapper) {
453 if (wrapper.empty())
454 return;
455 // Split the wrapper command based on whitespace (with quoting).
456 using CommandLineTokenizer =
457 StringTokenizerT<StringType, StringType::const_iterator>;
458 CommandLineTokenizer tokenizer(wrapper, FILE_PATH_LITERAL(" "));
459 tokenizer.set_quote_chars(FILE_PATH_LITERAL("'\""));
460 std::vector<StringType> wrapper_argv;
461 while (tokenizer.GetNext())
462 wrapper_argv.emplace_back(tokenizer.token());
463
464 // Prepend the wrapper and update the switches/arguments |begin_args_|.
465 argv_.insert(argv_.begin(), wrapper_argv.begin(), wrapper_argv.end());
466 begin_args_ += wrapper_argv.size();
467 }
468
469 #if defined(OS_WIN)
ParseFromString(const std::u16string & command_line)470 void CommandLine::ParseFromString(const std::u16string& command_line) {
471 std::u16string command_line_string;
472 TrimWhitespace(command_line, TRIM_ALL, &command_line_string);
473 if (command_line_string.empty())
474 return;
475
476 int num_args = 0;
477 char16_t** args = NULL;
478 args = reinterpret_cast<char16_t**>(::CommandLineToArgvW(
479 reinterpret_cast<LPCWSTR>(command_line_string.c_str()), &num_args));
480
481 DPLOG_IF(FATAL, !args) << "CommandLineToArgvW failed on command line: "
482 << UTF16ToUTF8(command_line);
483 InitFromArgv(num_args, args);
484 LocalFree(args);
485 }
486 #endif
487
GetCommandLineStringInternal(bool quote_placeholders) const488 CommandLine::StringType CommandLine::GetCommandLineStringInternal(
489 bool quote_placeholders) const {
490 StringType string(argv_[0]);
491 #if defined(OS_WIN)
492 string = QuoteForCommandLineToArgvW(string, quote_placeholders);
493 #endif
494 StringType params(GetArgumentsStringInternal(quote_placeholders));
495 if (!params.empty()) {
496 string.append(StringType(FILE_PATH_LITERAL(" ")));
497 string.append(params);
498 }
499 return string;
500 }
501
GetArgumentsStringInternal(bool quote_placeholders) const502 CommandLine::StringType CommandLine::GetArgumentsStringInternal(
503 bool quote_placeholders) const {
504 StringType params;
505 // Append switches and arguments.
506 bool parse_switches = parse_switches_;
507 for (size_t i = 1; i < argv_.size(); ++i) {
508 StringType arg = argv_[i];
509 StringType switch_string;
510 StringType switch_value;
511 parse_switches &= arg != kSwitchTerminator;
512 if (i > 1)
513 params.append(StringType(FILE_PATH_LITERAL(" ")));
514 if (parse_switches && IsSwitch(arg, &switch_string, &switch_value)) {
515 params.append(switch_string);
516 if (!switch_value.empty()) {
517 #if defined(OS_WIN)
518 switch_value =
519 QuoteForCommandLineToArgvW(switch_value, quote_placeholders);
520 #endif
521 params.append(kSwitchValueSeparator + switch_value);
522 }
523 } else {
524 #if defined(OS_WIN)
525 arg = QuoteForCommandLineToArgvW(arg, quote_placeholders);
526 #endif
527 params.append(arg);
528 }
529 }
530 return params;
531 }
532
533 } // namespace base
534