summaryrefslogtreecommitdiffstats
path: root/Doc/lib/libdis.tex
blob: 959c80fb94563c69929ba89d61809aa335a54728 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
\section{Standard module \sectcode{dis}}	% If implemented in Python
\stmodindex{dis}

\label{module-dis}

The \code{dis} module supports the analysis of Python byte code by
disassembling it.  Since there is no Python assembler, this module
defines the Python assembly language.  The Python byte code which
this module takes as an input is defined in the file 
\code{Include/opcode.h} and used by the compiler and the interpreter.

Example: Given the function myfunc

\bcode\begin{verbatim}
def myfunc(alist):
  return len(alist)
\end{verbatim}\ecode

the following command can be used to get the disassembly of myfunc:

\begin{verbatim}
>>> dis.dis(myfunc)
          0 SET_LINENO          1

          3 SET_LINENO          2
          6 LOAD_GLOBAL         0 (len)
          9 LOAD_FAST           0 (alist)
         12 CALL_FUNCTION       1
         15 RETURN_VALUE   
         16 LOAD_CONST          0 (None)
         19 RETURN_VALUE   
\end{verbatim}

The \code{dis} module defines the following functions:

\renewcommand{\indexsubitem}{(in module dis)}

% ---- 3.2. ----
% For each function, use a ``funcdesc'' block.  This has exactly two
% parameters (each parameters is contained in a set of curly braces):
% the first parameter is the function name (this automatically
% generates an index entry); the second parameter is the function's
% argument list.  If there are no arguments, use an empty pair of
% curly braces.  If there is more than one argument, separate the
% arguments with backslash-comma.  Optional parts of the parameter
% list are contained in \optional{...} (this generates a set of square
% brackets around its parameter).  Arguments are automatically set in
% italics in the parameter list.  Each argument should be mentioned at
% least once in the description; each usage (even inside \code{...})
% should be enclosed in \var{...}.

\begin{funcdesc}{dis}{\optional{bytesource}}
Disassemble the \var{bytesource} object. \var{bytesource} can denote
either a class, a method, a function, or a code object.  For a class,
it disassembles all methods.  For a single code sequence, it prints
one line per byte code instruction.  If no object is provided, it
disassembles the last traceback.
\end{funcdesc}

\begin{funcdesc}{distb}{\optional{tb}}
Disassembles the top-of-stack function of a traceback, using the last
traceback if none was passed.  The instruction causing the exception
is indicated.
\end{funcdesc}

\begin{funcdesc}{disassemble}{code\optional{\, lasti}}
Disassembles a code object, indicating the last instruction if \var{lasti}
was provided.  The output is divided in the following columns:
\begin{itemize}
\item the current instruction, indicated as \code{-->},
\item a labelled instruction, indicated with \code{>>},
\item the address of the instruction,
\item the operation code name,
\item operation parameters, and
\item interpretation of the parameters in parentheses.
\end{itemize}
The parameter interpretation recognizes local and global
variable names, constant values, branch targets, and compare
operators.
\end{funcdesc}

\begin{funcdesc}{disco}{code\optional{\, lasti}}
A synonym for disassemble.  It is more convenient to type, and kept
for compatibility with earlier Python releases.
\end{funcdesc}

\begin{datadesc}{opname}
Sequence of a operation names, indexable using the byte code.
\end{datadesc}

\begin{datadesc}{cmp_op}
Sequence of all compare operation names.
\end{datadesc}

\begin{datadesc}{hasconst}
Sequence of byte codes that have a constant parameter.
\end{datadesc}

\begin{datadesc}{hasname}
Sequence of byte codes that access a attribute by name.
\end{datadesc}

\begin{datadesc}{hasjrel}
Sequence of byte codes that have a relative jump target.
\end{datadesc}

\begin{datadesc}{hasjabs}
Sequence of byte codes that have an absolute jump target.
\end{datadesc}

\begin{datadesc}{haslocal}
Sequence of byte codes that access a a local variable.
\end{datadesc}

\begin{datadesc}{hascompare}
Sequence of byte codes of boolean operations.
\end{datadesc}

\subsection{Python Byte Code Instructions}

The Python compiler currently generates the following byte code
instructions.

\renewcommand{\indexsubitem}{(byte code insns)}

\begin{funcdesc}{STOP_CODE}{}
Indicates end-of-code to the compiler, not used by the interpreter.
\end{funcdesc}

\begin{funcdesc}{POP_TOP}{}
Removes the top-of-stack (TOS) item.
\end{funcdesc}

\begin{funcdesc}{ROT_TWO}{}
Swaps the two top-most stack items.
\end{funcdesc}

\begin{funcdesc}{ROT_THREE}{}
Lifts second and third stack item on position up, moves top down
to position three.
\end{funcdesc}

\begin{funcdesc}{DUP_TOP}{}
Duplicates the reference on top of the stack.
\end{funcdesc}

Unary Operations take the top of the stack, apply the operation, and
push the result back on the stack.

\begin{funcdesc}{UNARY_POSITIVE}{}
Implements \code{TOS = +TOS}.
\end{funcdesc}

\begin{funcdesc}{UNARY_NEG}{}
Implements \code{TOS = -TOS}.
\end{funcdesc}

\begin{funcdesc}{UNARY_NOT}{}
Implements \code{TOS = not TOS}.
\end{funcdesc}

\begin{funcdesc}{UNARY_CONVERT}{}
Implements \code{TOS = `TOS`}.
\end{funcdesc}

\begin{funcdesc}{UNARY_INVERT}{}
Implements \code{TOS = ~TOS}.
\end{funcdesc}

Binary operations remove the top of the stack (TOS) and the second top-most
stack item (TOS1) from the stack.  They perform the operation, and put the
result back on the stack.

\begin{funcdesc}{BINARY_POWER}{}
Implements \code{TOS = TOS1 ** TOS}.
\end{funcdesc}

\begin{funcdesc}{BINARY_MULTIPLY}{}
Implements \code{TOS = TOS1 * TOS}.
\end{funcdesc}

\begin{funcdesc}{BINARY_DIVIDE}{}
Implements \code{TOS = TOS1 / TOS}.
\end{funcdesc}

\begin{funcdesc}{BINARY_MODULO}{}
Implements \code{TOS = TOS1 \% TOS}.
\end{funcdesc}

\begin{funcdesc}{BINARY_ADD}{}
Implements \code{TOS = TOS1 + TOS}.
\end{funcdesc}

\begin{funcdesc}{BINARY_SUBTRACT}{}
Implements \code{TOS = TOS1 - TOS}.
\end{funcdesc}

\begin{funcdesc}{BINARY_SUBSCR}{}
Implements \code{TOS = TOS1[TOS] }.
\end{funcdesc}

\begin{funcdesc}{BINARY_LSHIFT}{}
Implements \code{TOS = TOS1 << TOS }.
\end{funcdesc}

\begin{funcdesc}{BINARY_RSHIFT}{}
Implements \code{TOS = TOS1 << TOS }.
\end{funcdesc}

\begin{funcdesc}{BINARY_AND}{}
Implements \code{TOS = TOS1 and TOS }.
\end{funcdesc}

\begin{funcdesc}{BINARY_XOR}{}
Implements \code{TOS = TOS1 \^{ }TOS }.
\end{funcdesc}

\begin{funcdesc}{BINARY_OR}{}
Implements \code{TOS = TOS1 or TOS }.
\end{funcdesc}

The slice opcodes take up to three parameters.

\begin{funcdesc}{SLICE+0}{}
Implements \code{TOS = TOS[:]}.
\end{funcdesc}

\begin{funcdesc}{SLICE+1}{}
Implements \code{TOS = TOS1[TOS:]}.
\end{funcdesc}

\begin{funcdesc}{SLICE+2}{}
Implements \code{TOS = TOS1[:TOS1]}.
\end{funcdesc}

\begin{funcdesc}{SLICE+3}{}
Implements \code{TOS = TOS2[TOS1:TOS]}.
\end{funcdesc}

Slice assignment needs even an additional parameter.  As any statement,
they put nothing on the stack.

\begin{funcdesc}{STORE_SLICE+0}{}
Implements \code{TOS[:]=TOS1}.
\end{funcdesc}

\begin{funcdesc}{STORE_SLICE+1}{}
Implements \code{TOS1[TOS:]=TOS2}.
\end{funcdesc}

\begin{funcdesc}{STORE_SLICE+2}{}
Implements \code{TOS1[:TOS]=TOS2}.
\end{funcdesc}

\begin{funcdesc}{STORE_SLICE+3}{}
Implements \code{TOS2[TOS1:TOS]=TOS3}.
\end{funcdesc}

\begin{funcdesc}{DELETE_SLICE+0}{}
Implements \code{del TOS[:]}.
\end{funcdesc}

\begin{funcdesc}{DELETE_SLICE+1}{}
Implements \code{del TOS1[TOS:]}.
\end{funcdesc}

\begin{funcdesc}{DELETE_SLICE+2}{}
Implements \code{del TOS1[:TOS]}.
\end{funcdesc}

\begin{funcdesc}{DELETE_SLICE+3}{}
Implements \code{del TOS2[TOS1:TOS]}.
\end{funcdesc}

\begin{funcdesc}{STORE_SUBSCR}{}
Implements \code{TOS1[TOS]=TOS2}.
\end{funcdesc}

\begin{funcdesc}{DELETE_SUBSCR}{}
Implements \code{del TOS1[TOS]}.
\end{funcdesc}

\begin{funcdesc}{PRINT_EXPR}{}
Implements the expression statement for the interactive mode.  TOS is
removed from the stack and printed.  In non-interactive mode, an
expression statement is terminated with POP_STACK.
\end{funcdesc}

\begin{funcdesc}{PRINT_ITEM}{}
Prints TOS.  There is one such instruction for
each item in the print statement.
\end{funcdesc}

\begin{funcdesc}{PRINT_NEWLINE}{}
Prints a new line on \code{sys.stdout}.  This is generated as the
last operation of a print statement, unless the statement ends
with a comma.
\end{funcdesc}

\begin{funcdesc}{BREAK_LOOP}{}
Terminates a loop due to a break statement.
\end{funcdesc}

\begin{funcdesc}{LOAD_LOCALS}{}
Pushes a reference to the locals of the current scope on the stack.
This is used in the code for a class definition: After the class body
is evaluated, the locals are passed to the class definition.
\end{funcdesc}

\begin{funcdesc}{RETURN_VALUE}{}
Returns with TOS to the caller of the function.
\end{funcdesc}

\begin{funcdesc}{EXEC_STMT}{}
Implements \code{exec TOS2,TOS1,TOS}.  The compiler fills
missing optional parameters with None.
\end{funcdesc}

\begin{funcdesc}{POP_BLOCK}{}
Removes one block from the block stack.  Per frame, there is a 
stack of blocks, denoting nested loops, try statements, and such.
\end{funcdesc}

\begin{funcdesc}{END_FINALLY}{}
Terminates a finally-block.  The interpreter recalls whether the
exception has to be re-raised, or whether the function returns,
and continues with the outer-next block.
\end{funcdesc}

\begin{funcdesc}{BUILD_CLASS}{}
Creates a new class object.  TOS is the methods dictionary, TOS1
the tuple of the names of the base classes, and TOS2 the class name.
\end{funcdesc}

All of the following opcodes expect arguments.  An argument is two
bytes, with the more significant byte last.

\begin{funcdesc}{STORE_NAME}{namei}
Implements \code{name = TOS}. \var{namei} is the index of \var{name}
in the attribute \code{co_names} of the code object.
The compiler tries to use STORE_LOCAL or STORE_GLOBAL if possible.
\end{funcdesc}

\begin{funcdesc}{DELETE_NAME}{namei}
Implements \code{del name}, where \var{namei} is the index into
\code{co_names} attribute of the code object.
\end{funcdesc}

\begin{funcdesc}{UNPACK_TUPLE}{count}
Unpacks TOS into \var{count} individual values, which are put onto
the stack right-to-left.
\end{funcdesc}

\begin{funcdesc}{UNPACK_LIST}{count}
Unpacks TOS into \var{count} individual values.
\end{funcdesc}

%\begin{funcdesc}{UNPACK_ARG}{count}
%This opcode is obsolete.
%\end{funcdesc}

\begin{funcdesc}{STORE_ATTR}{namei}
Implements \code{TOS.name = TOS1}, where \var{namei} is the index
of name in \code{co_names}.
\end{funcdesc}

\begin{funcdesc}{DELETE_ATTR}{namei}
Implements \code{del TOS.name}, using \var{namei} as index into
\code{co_names}.
\end{funcdesc}

\begin{funcdesc}{STORE_GLOBAL}{namei}
Works as STORE_NAME, but stores the name as a global.
\end{funcdesc}

\begin{funcdesc}{DELETE_GLOBAL}{namei}
Works as DELETE_NAME, but deletes a global name.
\end{funcdesc}

%\begin{funcdesc}{UNPACK_VARARG}{argc}
%This opcode is obsolete.
%\end{funcdesc}

\begin{funcdesc}{LOAD_CONST}{consti}
Pushes \code{co_consts[consti]} onto the stack.
\end{funcdesc}

\begin{funcdesc}{LOAD_NAME}{namei}
Pushes the value associated with \code{co_names[namei]} onto the stack.
\end{funcdesc}

\begin{funcdesc}{BUILD_TUPLE}{count}
Creates a tuple consuming \var{count} items from the stack, and pushes
the resulting tuple onto the stack.
\end{funcdesc}

\begin{funcdesc}{BUILD_LIST}{count}
Works as \code{BUILD_TUPLE}, but creates a list.
\end{funcdesc}

\begin{funcdesc}{BUILD_MAP}{zero}
Pushes an empty dictionary object onto the stack.  The argument is ignored
and set to zero by the compiler.
\end{funcdesc}

\begin{funcdesc}{LOAD_ATTR}{namei}
Replaces TOS with \code{getattr(TOS,co_names[namei]}.
\end{funcdesc}

\begin{funcdesc}{COMPARE_OP}{opname}
Performs a boolean operation.  The operation name can be found
in \code{cmp_op[opname]}.
\end{funcdesc}

\begin{funcdesc}{IMPORT_NAME}{namei}
Imports the module \code{co_names[namei]}.  The module object is
pushed onto the stack.  The current name space is not affect: for a
proper import statement, a subsequent \code{STORE_FAST} instruction
modifies the name space.
\end{funcdesc}

\begin{funcdesc}{IMPORT_FROM}{namei}
Imports the attribute \code{co_names[namei]}.  The module to import
from is found in TOS and left there.
\end{funcdesc}

\begin{funcdesc}{JUMP_FORWARD}{delta}
Increments byte code counter by \var{delta}.
\end{funcdesc}

\begin{funcdesc}{JUMP_IF_TRUE}{delta}
If TOS is true, increment the byte code counter by \var{delta}.  TOS is
left on the stack.
\end{funcdesc}

\begin{funcdesc}{JUMP_IF_FALSE}{delta}
If TOS is false, increment the byte code counter by \var{delta}.  TOS
is not changed. 
\end{funcdesc}

\begin{funcdesc}{JUMP_ABSOLUTE}{target}
Set byte code counter to \var{target}.
\end{funcdesc}

\begin{funcdesc}{FOR_LOOP}{delta}
Iterate over a sequence.  TOS is the current index, TOS1 the sequence.
First, the next element is computed.  If the sequence is exhausted,
increment byte code counter by \var{delta}.  Otherwise, push the
sequence, the incremented counter, and the current item onto the stack.
\end{funcdesc}

%\begin{funcdesc}{LOAD_LOCAL}{namei}
%This opcode is obsolete.
%\end{funcdesc}

\begin{funcdesc}{LOAD_GLOBAL}{namei}
Loads the global named \code{co_names[namei]} onto the stack.
\end{funcdesc}

%\begin{funcdesc}{SET_FUNC_ARGS}{argc}
%This opcode is obsolete.
%\end{funcdesc}

\begin{funcdesc}{SETUP_LOOP}{delta}
Pushes a block for a loop onto the block stack.  The block spans
from the current instruction with a size of \var{delta} bytes.
\end{funcdesc}

\begin{funcdesc}{SETUP_EXCEPT}{delta}
Pushes a try block from a try-except clause onto the block stack.
\var{delta} points to the first except block.
\end{funcdesc}

\begin{funcdesc}{SETUP_FINALLY}{delta}
Pushes a try block from a try-except clause onto the block stack.
\var{delta} points to the finally block.
\end{funcdesc}

\begin{funcdesc}{LOAD_FAST}{var_num}
Pushes a reference to the local \code{co_varnames[var_num]} onto
the stack.
\end{funcdesc}

\begin{funcdesc}{STORE_FAST}{var_num}
Stores TOS into the local \code{co_varnames[var_num]}.
\end{funcdesc}

\begin{funcdesc}{DELETE_FAST}{var_num}
Deletes local \code{co_varnames[var_num]}.
\end{funcdesc}

\begin{funcdesc}{SET_LINE_NO}{lineno}
Sets the current line number to \var{lineno}.
\end{funcdesc}

\begin{funcdesc}{RAISE_VARARGS}{argc}
Raises an exception. \var{argc} indicates the number of parameters
to the raise statement, ranging from 1 to 3.  The handler will find
the traceback as TOS2, the parameter as TOS1, and the exception
as TOS.
\end{funcdesc}

\begin{funcdesc}{CALL_FUNCTION}{argc}
Calls a function.  The low byte of \var{argc} indicates the number of
positional parameters, the high byte the number of keyword parameters.
On the stack, the opcode finds the keyword parameters first.  For each
keyword argument, the value is on top of the key.  Below the keyword
parameters, the positional parameters are on the stack, with the
right-most parameter on top.  Below the parameters, the function object
to call is on the stack.
\end{funcdesc}

\begin{funcdesc}{MAKE_FUNCTION}{argc}
Pushes a new function object on the stack.  TOS is the code associated
with the function.  The function object is defined to have \var{argc}
default parameters, which are found below TOS.
\end{funcdesc}

\begin{funcdesc}{BUILD_SLICE}{argc}
Pushes a slice object on the stack.  If \var{argc} is three, creates
\code{TOS3[TOS2:TOS1:TOS]}.  Otherwise, expects three arguments.
\end{funcdesc}