#!/bin/bash # # Use sys.setprofile() and maybe sys.settrace() to trace Oil execution. # # Usage: # ./pytrace.sh set -o nounset set -o pipefail set -o errexitsetconst global FOO = "bar" readonly ABUILD = ""setconst global FOO = "bar"~/git/alpine/abuild/abuild readonly -a RUN_ABUILD = '('bin/oil.py osh $ABUILD -h) # # Use Python's cProfile, which uses _lsprof. This is pretty fast. # # ~2.7 seconds without tracing proc abuild { time $(RUN_ABUILD[@]) ls -l -h *.json } # 3.8 seconds. So less than 2x overhead. proc cprofile-abuild { var out = 'abuild.cprofile' time python -m cProfile -o $out $(RUN_ABUILD[@]) ls -l $out } # Yeah I understand from this why Chrome Tracing / Flame Graphs are better. # This format doesn't respect the stack! # cumtime: bin/oil.py is the top, obviously proc print-cprofile { python -c ' import pstats p = pstats.Stats("abuild.cprofile") p.sort_stats("tottime").print_stats() ' } # # My Own Tracing with pytrace.py. Too slow! # # Abuild call/return events: # Parsing: 4,345,706 events # Execution: 530,924 events # Total events: # 14,918,308 # Actually that is still doable as binary. Not sure it's viewable in Chrome # though. # 14 bytes * 14.9M is 209 MB. proc abuild-trace { env _PY_TRACE=abuild.pytrace time $(RUN_ABUILD[@]) } # # Depends on pytracing, which is also too slow. # # Trace a parsing function proc parse { #local script=$ABUILD var script = $0 time bin/oil.py osh -n $script >/dev/null } # Trace the execution proc execute { #local script=$ABUILD var script = $0 #time bin/oil.py osh -c 'echo hi' time bin/oil.py osh $0 ls -l -h *.json } # Idea: I Want a flame graph based on determistic data! That way you get the # full stack trace. # It wasn't happening in the python-flamegraph stuff for some reason. Not sure # why. I think it is because I/O was exaggerated. # # Interpreter hook: # # for thread_id, frame in sys._current_frames().items(): # if thread_id == my_thread: # continue # Note that opening file descriptors can cause bugs! I have to open it above # descriptor 10! # python-flamegraph # - suffers from measurement error due to threads. # - is RunCommandSub is being inflated? # - well actually i'm not sure. I have to do it myself on a single thread # and see. # pytracing: # - the format is too bloated. It can't handle abuild -h. So I have to # optimize it. # # I want to unify these two approaches: both flame graphs and function traces. # # Advantage: sys.setprofile() gets C function call events! # # Reservoir Sampling! Get a list of all unique stacks. # # You can figure out the stack from the current/call/return sequence. So you # can use the reservoir sampling algorithm to get say 100,000 random stacks out # of 14 M events. # # sys.getframes() @Argv (CommandList children: [ (C {(set)} {(-o)} {(nounset)}) (C {(set)} {(-o)} {(pipefail)}) (C {(set)} {(-o)} {(errexit)}) (Assignment keyword: Assign_Readonly pairs: [ (assign_pair lhs: (LhsName name:ABUILD) op: Equal rhs: {(TildeSubPart prefix:"") (/git/alpine/abuild/abuild)} spids: [40] ) ] spids: [38] ) (Assignment keyword: Assign_Readonly flags: ["'-a'"] pairs: [ (assign_pair lhs: (LhsName name:RUN_ABUILD) op: Equal rhs: {(ArrayLiteralPart words:[{(bin/oil.py)}{(osh)}{($ VSub_Name "$ABUILD")}{(-h)}])} spids: [49] ) ] spids: [45] ) (FuncDef name: abuild body: (BraceGroup children: [ (TimeBlock pipeline: (C { (DQ (BracedVarSub token: bracket_op: (WholeArray op_id:Lit_At) spids: [84 89] ) ) } ) ) (C {(ls)} {(-l)} {(-h)} {(Lit_Other "*") (.json)}) ] spids: [78] ) spids: [74 77] ) (FuncDef name: cprofile-abuild body: (BraceGroup children: [ (Assignment keyword: Assign_Local pairs: [ (assign_pair lhs: (LhsName name:out) op: Equal rhs: {(abuild.cprofile)} spids: [118] ) ] spids: [116] ) (TimeBlock pipeline: (C {(python)} {(-m)} {(cProfile)} {(-o)} {($ VSub_Name "$out")} { (DQ (BracedVarSub token: bracket_op: (WholeArray op_id:Lit_At) spids: [136 141] ) ) } ) ) (C {(ls)} {(-l)} {($ VSub_Name "$out")}) ] spids: [113] ) spids: [109 112] ) (FuncDef name: print-cprofile body: (BraceGroup children: [ (C {(python)} {(-c)} { (SQ <"\n"> <"import pstats\n"> <"p = pstats.Stats(\"abuild.cprofile\")\n"> <"p.sort_stats(\"tottime\").print_stats()\n"> ) } ) ] spids: [167] ) spids: [163 166] ) (FuncDef name: abuild-trace body: (BraceGroup children: [ (SimpleCommand words: [ {(KW_Time time)} { (DQ (BracedVarSub token: bracket_op: (WholeArray op_id:Lit_At) spids: [234 239] ) ) } ] more_env: [(env_pair name:_PY_TRACE val:{(abuild.pytrace)} spids:[228])] ) ] spids: [225] ) spids: [221 224] ) (FuncDef name: parse body: (BraceGroup children: [ (Assignment keyword: Assign_Local pairs: [ (assign_pair lhs: (LhsName name:script) op: Equal rhs: {($ VSub_Number "$0")} spids: [271] ) ] spids: [269] ) (TimeBlock pipeline: (SimpleCommand words: [{(bin/oil.py)} {(osh)} {(-n)} {($ VSub_Name "$script")}] redirects: [(Redir op_id:Redir_Great fd:-1 arg_word:{(/dev/null)} spids:[285])] ) ) ] spids: [262] ) spids: [258 261] ) (FuncDef name: execute body: (BraceGroup children: [ (Assignment keyword: Assign_Local pairs: [ (assign_pair lhs: (LhsName name:script) op: Equal rhs: {($ VSub_Number "$0")} spids: [307] ) ] spids: [305] ) (TimeBlock pipeline:(C {(bin/oil.py)} {(osh)} {($ VSub_Number "$0")})) (C {(ls)} {(-l)} {(-h)} {(Lit_Other "*") (.json)}) ] spids: [298] ) spids: [294 297] ) (C {(DQ ($ VSub_At "$@"))}) ] )