Lines Matching +full:cmd +full:- +full:cnt +full:- +full:name

2 # SPDX-License-Identifier: GPL-2.0
5 # options --cpu and --time so that each job processes a different chunk
20 glb_prog_name = "parallel-perf.py"
41 def __init__(self, cmd, pipe_to, output_dir="."): argument
44 self.cmd = cmd
47 self.cmdout_name = f"{output_dir}/cmd.txt"
52 sh_cmd = [ shlex.quote(x) for x in self.cmd ]
53 return " ".join(self.cmd)
74 self.popen = subprocess.Popen(self.cmd, stdout=subprocess.PIPE, stderr=stderr)
78 self.popen = subprocess.Popen(self.cmd, stdout=stdout, stderr=stderr)
88 return [ f"Non-empty error file {self.stderr_name}" ]
139 x = "0" * (10 - len(x)) + x
140 return x[:len(x) - 9] + "." + x[-9:]
142 def InsertOptionAfter(cmd, option, after): argument
144 pos = cmd.index(after)
145 cmd.insert(pos + 1, option)
147 cmd.append(option)
149 def CreateWorkList(cmd, pipe_to, output_dir, cpus, time_ranges_by_cpu): argument
150 max_len = len(str(cpus[-1]))
151 cpu_dir_fmt = f"cpu-%.{max_len}u"
157 cpu_option = f"--cpu={cpu}"
162 tr_dir_fmt = "time-range"
166 tr_dir_fmt += f"-{pos}"
172 tr_dir_fmt += f"-%.{max_len}u"
180 time_option = "--time=" + NanoSecsToSecsStr(r[0]) + "," + NanoSecsToSecsStr(r[1])
183 work_cmd = list(cmd)
263 …process.Popen([perf, "script", "--header-only", "--input", file_name], stdout=subprocess.PIPE).std…
271 name = line[1:pos-1].strip()
273 if name in result:
274 orig_name = name
277 name = f"{orig_name} {nr}"
278 if name not in result:
281 result[name] = value
293 def Init(self, opt_element=-1, value_element=-1, opt_pos=-1, value_pos=-1, error=None):
305 pos = -1
308 if m and opt[:2] == f"-{short_name}":
313 self.Init(error = f"-{short_name} option missing value")
317 if opt[:n] == f"--{long_name}":
322 self.Init(error = f"--{long_name} option missing value")
326 self.Init(error = f"--{long_name} option expected '='")
328 if m and opt[:1] == "-" and opt[:2] != "--" and short_name in opt:
330 if "-" in opt[1:]:
331 hpos = opt[1:].index("-")
338 self.Init(error = f"-{short_name} option missing value")
353 if self.opt_element == -1:
362 def DetermineInputFileName(cmd): argument
363 p = OptPos(cmd, "i", "input", "perf.data")
389 def PerfDoubleQuickCommands(cmd, file_name): argument
390 cpu_str = ReadPerfOption(cmd, "C", "cpu")
391 time_str = ReadPerfOption(cmd, "", "time")
392 # Use double-quick sampling to determine trace data density
393 times_cmd = ["perf", "script", "--ns", "--input", file_name, "--itrace=qqi"]
395 times_cmd.append(f"--cpu={cpu_str}")
397 times_cmd.append(f"--time={time_str}")
399 cnts_cmd.append("-Fcpu")
400 times_cmd.append("-Fcpu,time")
415 cpu_time_range.remaining -= 1
416 cpu_time_range.interval_remaining -= 1
421 time = TimeVal(line[1][:-1], 0)
423 time_ranges[cpu_time_range.tr_pos][1] = time - 1
437 def ProcessCommandOutputLines(cmd, per_cpu, fn, *x): argument
439 pat = re.compile(r"\s*\[[0-9]+\]")
440 p = subprocess.Popen(cmd, stdout=subprocess.PIPE)
444 line = line.decode("utf-8")
449 cpu = int(line[0][1:-1])
490 def SplitTimeRangesByTraceDataDensity(time_ranges, cpus, nr, cmd, file_name, per_cpu, min_size, min… argument
495 cnts_cmd, times_cmd = PerfDoubleQuickCommands(cmd, file_name)
497 nr_cpus = cpus[-1] + 1 if per_cpu else 1
499 nr_cpus = cpus[-1] + 1
503 cpu_time_ranges = [ CPUTimeRange(-1) ]
516 cnt = cpu_time_range.sample_cnt
517 tot += cnt
518 if cnt > mx:
519 mx = cnt
521 print("cpu:", cpu_time_range.cpu, "sample_cnt", cnt)
550 max_time = time_ranges[-1][1]
553 cnt = cpu_time_range.sample_cnt
554 if cnt == 0:
559 n = int(round(cnt / interval, 0))
563 d, m = divmod(cnt, n)
568 cpu_time_range.remaining = cnt
587 duration = int((end - start + 1) / n)
592 time_ranges.append([start, start + duration - 1])
594 time_ranges[-1][1] = end
598 return r[1] - r[0] + 1
630 if new_tr[i - 1][1] + 1 == new_tr[i][0]:
631 new_tr[i][0] = new_tr[i - 1][0]
632 del new_tr[i - 1]
640 if time_ranges[-1][1] >= max_time:
641 time_ranges[-1][1] = None
644 …e_str}'\nCheck also 'time of first sample' and 'time of last sample' in perf script --header-only")
651 if i != 0 and start <= time_ranges[i - 1][1]:
672 …"perf command bad cpu option: '{cpu_str}'\nCheck also 'nrcpus avail' in perf script --header-only")
693 return [-1]
696 a = r.split("-")
720 self.orig_cmd = list(self.cmd)
721 self.perf = self.cmd[0]
725 raise Exception("Bad options (negative values): try -h option for help")
738 print("cmd", self.cmd)
739 self.file_name = DetermineInputFileName(self.cmd)
747 self.time_str = ExtractPerfOption(self.cmd, "", "time")
755 self.cpu_str = ExtractPerfOption(self.cmd, "C", "cpu")
762 self.cpus = [-1]
782 # Re-combined time ranges should be the same
795 …self.worklist = CreateWorkList(self.cmd, self.pipe_to, self.output_dir, self.cpus, self.split_time…
798 if "--per-thread" in self.cmd_line.split():
803 # --no-per-cpu option takes precedence
808 # Default to per-cpu for Intel PT data that was recorded per-cpu,
825 # Prefer open-ended time range to starting / ending with min_time / max_time resp.
851 --cpu and --time so that each job processes a different chunk of the data.
855 Follow the options by '--' and then the perf script command e.g.
857 $ perf record -a -- sleep 10
858 $ parallel-perf.py --nr=4 -- perf script --ns
860 $ tree parallel-perf-output/
861 parallel-perf-output/
862 ├── time-range-0
863 │   ├── cmd.txt
865 ├── time-range-1
866 │   ├── cmd.txt
868 ├── time-range-2
869 │   ├── cmd.txt
871 └── time-range-3
872 ├── cmd.txt
874 $ find parallel-perf-output -name cmd.txt | sort | xargs grep -H .
875 parallel-perf-output/time-range-0/cmd.txt:perf script --time=,9466.504461499 --ns
876 parallel-perf-output/time-range-1/cmd.txt:perf script --time=9466.504461500,9469.005396999 --ns
877 parallel-perf-output/time-range-2/cmd.txt:perf script --time=9469.005397000,9471.506332499 --ns
878 parallel-perf-output/time-range-3/cmd.txt:perf script --time=9471.506332500, --ns
881 --dlfilter and --script, so that the benefit of running parallel jobs
884 If option --pipe-to is used, standard output is first piped through that
890 written to files named err.txt. In addition, files named cmd.txt contain the
894 If any job exits with a non-zero exit code, then all jobs are killed and no
895 more are started. A message is printed if any job results in a non-empty
898 There is a separate output subdirectory for each time range. If the --per-cpu
899 option is used, these are further grouped under cpu-n subdirectories, e.g.
901 $ parallel-perf.py --per-cpu --nr=2 -- perf script --ns --cpu=0,1
903 $ tree parallel-perf-output
904 parallel-perf-output/
905 ├── cpu-0
906 │   ├── time-range-0
907 │   │   ├── cmd.txt
909 │   └── time-range-1
910 │   ├── cmd.txt
912 └── cpu-1
913 ├── time-range-0
914 │   ├── cmd.txt
916 └── time-range-1
917 ├── cmd.txt
919 $ find parallel-perf-output -name cmd.txt | sort | xargs grep -H .
920 parallel-perf-output/cpu-0/time-range-0/cmd.txt:perf script --cpu=0 --time=,9469.005396999 --ns
921 parallel-perf-output/cpu-0/time-range-1/cmd.txt:perf script --cpu=0 --time=9469.005397000, --ns
922 parallel-perf-output/cpu-1/time-range-0/cmd.txt:perf script --cpu=1 --time=,9469.005396999 --ns
923 parallel-perf-output/cpu-1/time-range-1/cmd.txt:perf script --cpu=1 --time=9469.005397000, --ns
925 Subdivisions of time range, and cpus if the --per-cpu option is used, are
926 expressed by the --time and --cpu perf script options respectively. If the
927 supplied perf script command has a --time option, then that time range is
929 'time of last sample' is used (refer perf script --header-only). Similarly, the
930 supplied perf script command may provide a --cpu option, and only those CPUs
933 To prevent time intervals becoming too small, the --min-interval option can
940 double-quick (--itrace=qqi) samples, and choosing time ranges that encompass
942 the same for each CPU processed. For Intel PT, --per-cpu is the default, but
943 that can be overridden by --no-per-cpu. Note, for Intel PT, double-quick
946 perf Intel PT documentation). The minimum number of double-quick samples that
947 will define a time range can be set by the --min_size option, which defaults to
950 …ap.add_argument("-o", "--output-dir", default="parallel-perf-output", help="output directory (defa…
951 …ap.add_argument("-j", "--jobs", type=int, default=0, help="maximum number of jobs to run in parall…
952 …ap.add_argument("-n", "--nr", type=int, default=0, help="number of time subdivisions (default is t…
953 …ap.add_argument("-i", "--interval", type=float, default=0, help="subdivide the time range using th…
954 …ap.add_argument("-c", "--per-cpu", action="store_true", help="process data for each CPU in paralle…
955 …ap.add_argument("-m", "--min-interval", type=float, default=glb_min_interval, help=f"minimum inter…
956 ap.add_argument("-p", "--pipe-to", help="command to pipe output to (optional)")
957 …ap.add_argument("-N", "--no-per-cpu", action="store_true", help="do not process data for each CPU …
958 …ap.add_argument("-b", "--min_size", type=int, default=glb_min_samples, help="minimum data size (fo…
959 …ap.add_argument("-D", "--dry-run", action="store_true", help="do not run any jobs, just show the p…
960 …ap.add_argument("-q", "--quiet", action="store_true", help="do not print any messages except error…
961 ap.add_argument("-v", "--verbose", action="store_true", help="print more messages")
962 ap.add_argument("-d", "--debug", action="store_true", help="print debugging messages")
965 split_pos = cmd_line.index("--")
966 cmd = cmd_line[split_pos + 1:]
969 cmd = None
972 a.cmd = cmd
975 if a.cmd == None:
979 raise Exception("Command line must contain '--' before perf command")