Files

191 lines
5.4 KiB
Python

"""
JCL Parser - parses JCL scripts into structured JobStep objects.
Phase 1: supports JOB, EXEC PGM=, DD, SYSOUT, SYSIN inline data,
COND=(code,op), //* comments.
Phase 2+: PROC, GDG, COND with step names, EVEN/ONLY.
"""
import re
from dataclasses import dataclass, field
from typing import Optional
@dataclass
class DDEntry:
    """A single DD statement belonging to a job step.

    Only ``dd_name`` is required; every other attribute keeps its default
    when the corresponding DD parameter is absent.
    """

    # Name field of the DD statement (e.g. SYSIN, SYSPRINT).
    dd_name: str
    # Value of the DSN= parameter, if any.
    dsn: Optional[str] = None
    # First sub-parameter of DISP= (e.g. SHR, NEW, OLD), if any.
    disp: Optional[str] = None
    # Value of the SYSOUT= parameter ("*" or a class), if any.
    sysout: Optional[str] = None
    # In-stream data records; a fresh list is created per instance.
    inline_data: list[str] = field(default_factory=list)
    # UNIT= and SPACE= values; available for callers to set.
    unit: Optional[str] = None
    space: Optional[str] = None
@dataclass
class CondParam:
    """A COND=(code,operator[,stepname]) test attached to a job step."""

    # Return-code value the test compares against.
    code: int
    # Comparison operator: EQ, NE, GT, GE, LT or LE.
    operator: str
    # Step whose return code is tested; None means "any previous step".
    step_name: Optional[str] = None
@dataclass
class JobStep:
    """One EXEC step of a job together with its DD statements."""

    # Name field of the EXEC statement.
    step_name: str
    # Program named on the EXEC statement.
    program: str
    # DD statements that follow the EXEC statement, in source order.
    dd_entries: list[DDEntry] = field(default_factory=list)
    # Parsed COND= parameter, or None when the step has none.
    cond: Optional[CondParam] = None
    # Contents of the quoted PARM= string, or None when absent.
    parm: Optional[str] = None
@dataclass
class Job:
    """A parsed job: its name plus the ordered list of steps."""

    # Name field of the JOB statement.
    job_name: str
    # Steps in the order their EXEC statements appear.
    steps: list[JobStep] = field(default_factory=list)
# Lookup table from a COND operator mnemonic to its comparison.
# Each callable takes (rc, code) and returns the boolean result of
# "rc <operator> code".
COND_OPS = {
    # equality tests
    "EQ": lambda rc, code: rc == code,
    "NE": lambda rc, code: rc != code,
    # strictly / inclusively greater
    "GT": lambda rc, code: rc > code,
    "GE": lambda rc, code: rc >= code,
    # strictly / inclusively less
    "LT": lambda rc, code: rc < code,
    "LE": lambda rc, code: rc <= code,
}
# Pre-compiled patterns used by parse_jcl and its helpers.
# JCL names may contain the national characters $, # and @ in addition to
# letters, digits and (leniently) underscore.
_JCL_NAME = r"[\w$#@]+"
# The JOB keyword must be the operation field (second token); matching it
# anywhere would also hit values such as DSN=PROD.JOB.LIB or PARM='RUN JOB'.
_JOB_RE = re.compile(r"(\S+)\s+JOB\b", re.IGNORECASE)
_EXEC_RE = re.compile(
    rf"({_JCL_NAME})\s+EXEC\s+(?:PGM=)?({_JCL_NAME})", re.IGNORECASE
)
_COND_RE = re.compile(r"COND=\s*\(\s*(\d+)\s*,\s*(\w+)", re.IGNORECASE)
_PARM_RE = re.compile(r"PARM=\s*'([^']*)'", re.IGNORECASE)
_DD_RE = re.compile(rf"({_JCL_NAME})\s+DD\b\s*(.*)", re.IGNORECASE)
_DSN_RE = re.compile(r"DSN(?:AME)?=\s*([^\s,]+)", re.IGNORECASE)
_DISP_RE = re.compile(
    r"DISP=\s*\(?([^,\s)]+)(?:,([^,\s)]+))?(?:,([^,\s)]+))?\)?",
    re.IGNORECASE,
)
_SYSOUT_RE = re.compile(r"SYSOUT=\s*(\*|\w+)", re.IGNORECASE)
# "DD *" only: the asterisk must be the first positional operand, so that
# SYSOUT=* or a DSN=*.STEP.DD backreference does not start in-stream data.
_INLINE_RE = re.compile(r"\*(?=[\s,]|$)")


def _parse_exec(content: str) -> Optional[JobStep]:
    """Build a JobStep from an EXEC statement, or return None if not EXEC."""
    exec_match = _EXEC_RE.match(content)
    if exec_match is None:
        return None

    cond = None
    cond_match = _COND_RE.search(content)
    if cond_match:
        cond = CondParam(
            code=int(cond_match.group(1)),
            operator=cond_match.group(2).upper(),
        )

    parm_match = _PARM_RE.search(content)
    return JobStep(
        step_name=exec_match.group(1),
        program=exec_match.group(2),
        cond=cond,
        parm=parm_match.group(1) if parm_match else None,
    )


def _build_dd_entry(dd_name: str, dd_params: str) -> DDEntry:
    """Build a DDEntry from a DD name and its raw operand text."""
    dd = DDEntry(dd_name=dd_name)

    dsn_match = _DSN_RE.search(dd_params)
    if dsn_match:
        dd.dsn = dsn_match.group(1)

    disp_match = _DISP_RE.search(dd_params)
    if disp_match:
        # Only the status sub-parameter (first position) is recorded.
        dd.disp = disp_match.group(1)

    sysout_match = _SYSOUT_RE.search(dd_params)
    if sysout_match:
        dd.sysout = sysout_match.group(1)

    return dd


def parse_jcl(filepath: str) -> Optional[Job]:
    """Parse a JCL file into a Job object.

    Recognized statements: JOB, EXEC (PGM=), DD (DSN/DSNAME, DISP, SYSOUT)
    and SYSIN in-stream data ("//SYSIN DD *"). Comment statements ("//*"),
    blank lines and anything else are ignored.

    In-stream data ends at a "/*" delimiter, at the next "//" statement, or
    at end of file; its records are stored whitespace-stripped, with blank
    records dropped.

    Args:
        filepath: Path of the JCL file, read as UTF-8.

    Returns:
        The Job built from the last JOB statement in the file, or None when
        the file contains no JOB statement. Steps that appear before any
        JOB statement are not attached to a job.

    Raises:
        OSError: If the file cannot be opened or read.
        UnicodeDecodeError: If the file is not valid UTF-8.
    """
    with open(filepath, "r", encoding="utf-8") as f:
        raw_lines = f.readlines()

    # Continuation handling: lines ending with ',' continue on next line
    lines = _merge_continuations(raw_lines)

    job: Optional[Job] = None
    current_step: Optional[JobStep] = None
    # DD currently receiving in-stream data, or None outside a data block.
    inline_dd: Optional[DDEntry] = None

    for line in lines:
        stripped = line.strip()
        if not stripped:
            continue

        if inline_dd is not None:
            if stripped == "/*":
                inline_dd = None
                continue
            if not stripped.startswith("//"):
                inline_dd.inline_data.append(stripped)
                continue
            # A "//" statement implicitly terminates "DD *" data; fall
            # through so the statement itself is still parsed instead of
            # being swallowed as data.
            inline_dd = None

        # Skip comments and anything that is not a JCL statement.
        if stripped.startswith("//*") or not stripped.startswith("//"):
            continue

        content = stripped[2:].strip()

        # JOB statement: //jobname JOB ...
        job_match = _JOB_RE.match(content)
        if job_match:
            job = Job(job_name=job_match.group(1))
            # DDs that follow a JOB statement must not attach to a step
            # parsed before it.
            current_step = None
            continue

        # EXEC statement
        step = _parse_exec(content)
        if step is not None:
            current_step = step
            if job is not None:
                job.steps.append(step)
            continue

        # DD statement (ignored until the first EXEC has been seen)
        dd_match = _DD_RE.match(content)
        if dd_match and current_step is not None:
            dd_name, dd_params = dd_match.groups()
            dd = _build_dd_entry(dd_name, dd_params)
            current_step.dd_entries.append(dd)
            if dd_name.upper() == "SYSIN" and _INLINE_RE.match(dd_params):
                inline_dd = dd

    return job
def _merge_continuations(lines: list[str]) -> list[str]:
"""Merge JCL continuation lines (lines ending with ',')."""
merged = []
buffer = ""
for line in lines:
stripped = line.rstrip("\n\r")
if buffer:
buffer += stripped
else:
buffer = stripped
# Check if line ends with continuation
if stripped.rstrip().endswith(",") and not stripped.strip().startswith("//*"):
continue
merged.append(buffer)
buffer = ""
if buffer:
merged.append(buffer)
return merged