Py-TokenGate/code_inspector.py at trunk · TavariAgent/Py-TokenGate · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
# -*- coding: utf-8 -*-
# code_inspector.py
"""
Pre-execution code inspection for allocation and confidence heuristics.

This module analyzes function bytecode and code-object metadata before
execution to estimate relative complexity, likely resource pressure, and
initial allocation guidance.

The results are heuristic. They are intended to improve first-pass budget
selection and safety decisions before runtime measurements are available.
"""

import dis
import sys
from dataclasses import dataclass
from enum import Enum
from typing import Callable, Dict, Any, List


class ComplexityLevel(Enum):
    """Discrete complexity bands derived from heuristic bytecode analysis."""
    TRIVIAL = 1  # < 10 score: Simple getters, basic math
    SIMPLE = 2  # 10-30: Standard business logic
    MODERATE = 3  # 30-60: Multiple branches, some loops
    COMPLEX = 4  # 60-100: Heavy computation, nested loops
    EXTREME = 5  # > 100: Matrix ops, recursive algorithms


@dataclass
class CodeMetrics:
    """Structured result of one code-object analysis pass."""
    func_name: str
    bytecode_length: int
    stack_size: int
    local_vars: int
    arg_count: int
    const_count: int
    const_footprint: int
    external_calls: List[str]
    loop_count: int
    branch_count: int
    complexity_score: float
    complexity_level: ComplexityLevel
    confidence: float

    def to_dict(self) -> Dict[str, Any]:
        """Return a serialization-friendly dictionary representation."""
        return {
            'func_name': self.func_name,
            'bytecode_length': self.bytecode_length,
            'stack_size': self.stack_size,
            'local_vars': self.local_vars,
            'arg_count': self.arg_count,
            'const_count': self.const_count,
            'const_footprint': self.const_footprint,
            'external_calls': self.external_calls,
            'loop_count': self.loop_count,
            'branch_count': self.branch_count,
            'complexity_score': self.complexity_score,
            'complexity_level': self.complexity_level.name,
            'confidence': self.confidence
        }


class CodeInspector:
    """Static bytecode analyzer for pre-execution resource heuristics.

    Inspects code objects to derive complexity indicators, confidence scores,
    and initial allocation recommendations before runtime profiling exists.
    """

    # Weight factors for complexity calculation
    WEIGHTS = {
        'bytecode': 0.3,  # Bytecode length impact
        'stack': 0.2,  # Stack depth impact
        'constants': 0.15,  # Constant footprint impact
        'calls': 0.15,  # External call impact
        'loops': 0.1,  # Loop impact
        'branches': 0.1  # Branch impact
    }

    # Confidence modifiers
    CONFIDENCE_BASE = 85.0  # Start at 85% confidence
    CONFIDENCE_DECAY = 0.3  # Lose 0.3% per complexity point above 50

    @staticmethod
    def analyze(func: Callable) -> CodeMetrics:
        """
        Analyze a callable's code object and derive heuristic complexity metrics.

        Args:
            func: Callable to inspect. Must expose a ``__code__`` attribute.

        Returns:
            CodeMetrics containing bytecode, control-flow, and confidence data.
        """
        if not hasattr(func, '__code__'):
            raise ValueError(f"Function {func} has no __code__ attribute")

        code = func.__code__  # type: ignore[attr-defined]

        # Extract basic metrics
        func_name = code.co_name
        bytecode_length = len(code.co_code)
        stack_size = code.co_stacksize
        local_vars = code.co_nlocals
        arg_count = code.co_argcount

        # Analyze constants
        const_count = len(code.co_consts)
        const_footprint = CodeInspector._calculate_const_footprint(code.co_consts)

        # Analyze external calls
        external_calls = CodeInspector._extract_external_calls(code)

        # Analyze control flow
        loop_count = CodeInspector._estimate_loops(code)
        branch_count = CodeInspector._estimate_branches(code)

        # Calculate complexity score
        complexity_score = CodeInspector._calculate_complexity(
            bytecode_length=bytecode_length,
            stack_size=stack_size,
            const_footprint=const_footprint,
            external_calls_count=len(external_calls),
            loop_count=loop_count,
            branch_count=branch_count
        )

        # Classify complexity
        complexity_level = CodeInspector._classify_complexity(complexity_score)

        # Calculate confidence
        confidence = CodeInspector._calculate_confidence(complexity_score)

        return CodeMetrics(
            func_name=func_name,
            bytecode_length=bytecode_length,
            stack_size=stack_size,
            local_vars=local_vars,
            arg_count=arg_count,
            const_count=const_count,
            const_footprint=const_footprint,
            external_calls=external_calls,
            loop_count=loop_count,
            branch_count=branch_count,
            complexity_score=complexity_score,
            complexity_level=complexity_level,
            confidence=confidence
        )

    @staticmethod
    def _calculate_const_footprint(consts: tuple) -> int:
        """Estimate the memory footprint of constants referenced by a code object."""
        footprint = 0

        for const in consts:
            if const is None:
                continue

            if isinstance(const, (str, bytes)):
                footprint += len(const)
            elif isinstance(const, (list, tuple)):
                # Recursively estimate collection size
                footprint += sys.getsizeof(const)
            elif isinstance(const, dict):
                footprint += sys.getsizeof(const)
            elif isinstance(const, (int, float)):
                footprint += sys.getsizeof(const)
            else:
                # Generic object
                try:
                    footprint += sys.getsizeof(const)
                except:
                    footprint += 64  # Default estimate

        return footprint

    @staticmethod
    def _extract_external_calls(code) -> List[str]:
        """Collect referenced external names from the code object.

        This is a name-based heuristic used to flag likely library, I/O, or
        dynamic-execution behavior.
        """
        external_calls = []
        names = set(code.co_names)

        # Common expensive operations
        expensive_patterns = [
            'json', 'pickle', 'marshal',  # Serialization
            'requests', 'urllib', 'http',  # Network
            'open', 'read', 'write',  # File I/O
            'numpy', 'pandas', 'scipy',  # Heavy computation
            'compile', 'exec', 'eval',  # Dynamic execution
            'time.sleep', 'asyncio.sleep'  # Blocking operations
        ]

        for name in names:
            # Track all names but flag expensive ones
            external_calls.append(name)

        return sorted(external_calls)

    @staticmethod
    def _estimate_loops(code) -> int:
        """Estimate loop presence from bytecode instruction patterns."""
        loop_count = 0
        instructions = list(dis.get_instructions(code))

        for instr in instructions:
            # FOR_ITER indicates a for loop
            if instr.opname == 'FOR_ITER':
                loop_count += 1
            # JUMP_BACKWARD can indicate while loops
            elif instr.opname in ('JUMP_BACKWARD', 'JUMP_ABSOLUTE'):
                # Be conservative - not all jumps are loops
                # Only count backward jumps as likely loops
                if hasattr(instr, 'argval') and isinstance(instr.argval, int):
                    if instr.argval < instr.offset:
                        loop_count += 0.5  # Weight lower since might not be loop

        return int(loop_count)

    @staticmethod
    def _estimate_branches(code) -> int:
        """Estimate conditional branch count from jump instructions."""
        branch_count = 0
        instructions = list(dis.get_instructions(code))

        for instr in instructions:
            if 'POP_JUMP' in instr.opname or 'JUMP_IF' in instr.opname:
                branch_count += 1

        return branch_count

    @staticmethod
    def _calculate_complexity(
            bytecode_length: int,
            stack_size: int,
            const_footprint: int,
            external_calls_count: int,
            loop_count: int,
            branch_count: int
    ) -> float:
        """
        Combine normalized static indicators into a heuristic complexity score.

        Higher scores suggest greater structural complexity and potentially
        higher initial resource pressure.
        """
        # Normalize metrics to 0-1 scale
        # These thresholds are heuristic - adjust based on real data
        norm_bytecode = min(bytecode_length / 500, 1.0)
        norm_stack = min(stack_size / 20, 1.0)
        norm_constants = min(const_footprint / 10000, 1.0)
        norm_calls = min(external_calls_count / 15, 1.0)
        norm_loops = min(loop_count / 5, 1.0)
        norm_branches = min(branch_count / 10, 1.0)

        # Apply weights
        w = CodeInspector.WEIGHTS
        weighted_sum = (
                norm_bytecode * w['bytecode'] +
                norm_stack * w['stack'] +
                norm_constants * w['constants'] +
                norm_calls * w['calls'] +
                norm_loops * w['loops'] +
                norm_branches * w['branches']
        )

        # Scale to 0-200+ range (most functions will be 0-100)
        complexity = weighted_sum * 200

        return round(complexity, 2)

    @staticmethod
    def _classify_complexity(score: float) -> ComplexityLevel:
        """Map a complexity score to its configured complexity band."""
        if score < 10:
            return ComplexityLevel.TRIVIAL
        elif score < 30:
            return ComplexityLevel.SIMPLE
        elif score < 60:
            return ComplexityLevel.MODERATE
        elif score < 100:
            return ComplexityLevel.COMPLEX
        else:
            return ComplexityLevel.EXTREME

    @staticmethod
    def _calculate_confidence(complexity_score: float) -> float:
        """
        Convert complexity score into a heuristic prediction-confidence value.

        Simpler functions retain higher confidence; more structurally complex
        functions reduce confidence.
        """
        base = CodeInspector.CONFIDENCE_BASE
        decay = CodeInspector.CONFIDENCE_DECAY

        if complexity_score <= 50:
            # Simple functions maintain high confidence
            confidence = base
        else:
            # Complex functions lose confidence
            excess_complexity = complexity_score - 50
            confidence = base - (excess_complexity * decay)

        # Clamp to a reasonable range
        confidence = max(20.0, min(95.0, confidence))

        return round(confidence, 1)

    @staticmethod
    def predict_initial_allocation(metrics: CodeMetrics, base_budget_mb: int = 50) -> Dict[str, Any]:
        """
        Derive an initial memory and timeout recommendation from analyzed metrics.

        Args:
            metrics: CodeMetrics returned by ``analyze()``.
            base_budget_mb: Baseline memory budget used for scaling.

        Returns:
            Dictionary containing recommended memory, timeout, confidence,
            reasoning text, and the underlying complexity score.
        """
        # Complexity-based multipliers
        multipliers = {
            ComplexityLevel.TRIVIAL: 0.5,
            ComplexityLevel.SIMPLE: 1.0,
            ComplexityLevel.MODERATE: 1.5,
            ComplexityLevel.COMPLEX: 2.5,
            ComplexityLevel.EXTREME: 4.0
        }

        multiplier = multipliers[metrics.complexity_level]

        # Calculate allocations
        memory_mb = int(base_budget_mb * multiplier)

        # Timeout based on complexity
        timeout_seconds = 10 + (metrics.complexity_score * 0.5)
        timeout_seconds = min(timeout_seconds, 300)  # Cap at 5 minutes

        # Build reasoning
        reasoning = f"Complexity: {metrics.complexity_level.name} (score: {metrics.complexity_score:.1f}), "
        reasoning += f"Confidence: {metrics.confidence}%"

        if metrics.loop_count > 0:
            reasoning += f", {metrics.loop_count} loop(s)"
        if len(metrics.external_calls) > 5:
            reasoning += f", {len(metrics.external_calls)} external calls"

        return {
            'memory_mb': memory_mb,
            'timeout_seconds': timeout_seconds,
            'confidence': metrics.confidence,
            'reasoning': reasoning,
            'complexity_score': metrics.complexity_score
        }


# ============================================================================
# TESTING & EXAMPLES
# ============================================================================

if __name__ == '__main__':

    print("=" * 70)
    print("CODE INSPECTOR TEST")
    print("=" * 70)
    print()


    # Test functions with varying complexity

    def trivial_function(x):
        """Trivial: just return input."""
        return x


    def simple_function(a, b):
        """Simple: basic arithmetic."""
        return a + b * 2


    def moderate_function(data):
        """Moderate: some loops and logic."""
        result = []
        for item in data:
            if item > 0:
                result.append(item * 2)
        return result


    def complex_function(size):
        """Complex: nested loops."""
        matrix = [[0 for _ in range(size)] for _ in range(size)]
        for i in range(size):
            for j in range(size):
                matrix[i][j] = i * j
        return matrix


    def extreme_function(n):
        """Extreme: recursive + heavy computation."""
        if n <= 1:
            return 1
        result = extreme_function(n - 1) + extreme_function(n - 2)
        data = [i ** 2 for i in range(100)]
        return result + sum(data)


    # Analyze each function
    test_functions = [
        trivial_function,
        simple_function,
        moderate_function,
        complex_function,
        extreme_function
    ]

    for func in test_functions:
        print("-" * 70)
        print(f"Analyzing: {func.__name__}")
        print("-" * 70)

        metrics = CodeInspector.analyze(func)

        print(f"  Bytecode length:  {metrics.bytecode_length}")
        print(f"  Stack size:       {metrics.stack_size}")
        print(f"  Local vars:       {metrics.local_vars}")
        print(f"  Constants:        {metrics.const_count} ({metrics.const_footprint} bytes)")
        print(f"  External calls:   {len(metrics.external_calls)}")
        if metrics.external_calls:
            print(f"    Calls: {', '.join(metrics.external_calls[:5])}")
        print(f"  Loops:            {metrics.loop_count}")
        print(f"  Branches:         {metrics.branch_count}")
        print()
        print(f"  Complexity Score: {metrics.complexity_score:.1f}")
        print(f"  Complexity Level: {metrics.complexity_level.name}")
        print(f"  Confidence:       {metrics.confidence}%")
        print()

        # Get allocation prediction
        allocation = CodeInspector.predict_initial_allocation(metrics)
        print(f"  Recommended Allocation:")
        print(f"    Memory:   {allocation['memory_mb']} MB")
        print(f"    Timeout:  {allocation['timeout_seconds']:.0f} seconds")
        print(f"    Reasoning: {allocation['reasoning']}")
        print()

    print("=" * 70)
    print("INSPECTOR TEST COMPLETE")
    print("=" * 70)
    print()
    print("Next Steps:")
    print("  1. Integrate with overflow_guard.py")
    print("  2. Add token-level tracking")
    print("  3. Implement retry logic with allocation bumping")
    print("  4. Build confidence-weighted optimization (2% drops)")