from dataclasses import dataclass EBCDIC_TO_ASCII = { 0xC1: 'A', 0xC2: 'B', 0xC3: 'C', 0xC4: 'D', 0xC5: 'E', 0xC6: 'F', 0xC7: 'G', 0xC8: 'H', 0xC9: 'I', 0xD1: 'J', 0xD2: 'K', 0xD3: 'L', 0xD4: 'M', 0xD5: 'N', 0xD6: 'O', 0xD7: 'P', 0xD8: 'Q', 0xD9: 'R', 0xE2: 'S', 0xE3: 'T', 0xE4: 'U', 0xE5: 'V', 0xE6: 'W', 0xE7: 'X', 0xE8: 'Y', 0xE9: 'Z', 0xF0: '0', 0xF1: '1', 0xF2: '2', 0xF3: '3', 0xF4: '4', 0xF5: '5', 0xF6: '6', 0xF7: '7', 0xF8: '8', 0xF9: '9', 0x40: ' ', 0x4B: '.', 0x6B: ',', 0x5A: '!', } @dataclass class CobolIRField: raw_hex: str decoded_value: str encoding: str field_type: str length: int scale: int signed: bool @dataclass class JavaIRField: raw_value: str decoded_value: str field_type: str nullable: bool @dataclass class IRRecord: field_name: str cobol: CobolIRField | None = None java: JavaIRField | None = None class Normalizer: def normalize_encoding(self, raw: bytes, encoding: str) -> str: if encoding == "EBCDIC": return self._ebcdic_to_ascii(raw) return raw.decode("ascii", errors="replace") def normalize_comp3(self, raw: bytes) -> str: if not raw: return "0" nibbles = [] for b in raw: nibbles.append((b >> 4) & 0x0F) nibbles.append(b & 0x0F) sign = nibbles.pop() value = 0 for n in nibbles: value = value * 10 + n if sign in (0x0D, 0x0B): value = -value return str(value) def normalize_date(self, date_str: str) -> str: s = date_str.strip() if len(s) == 8 and s.isdigit(): return f"{s[0:4]}-{s[4:6]}-{s[6:8]}" return s def to_ir_record(self, field_name, raw_hex, decoded_value, encoding, field_type, length=0, scale=0, signed=False) -> IRRecord: return IRRecord( field_name=field_name, cobol=CobolIRField( raw_hex=raw_hex, decoded_value=decoded_value, encoding=encoding, field_type=field_type, length=length, scale=scale, signed=signed)) def to_null_ir(self, field_name, side="java") -> IRRecord: if side == "java": return IRRecord(field_name=field_name, cobol=None, java=JavaIRField(raw_value="", decoded_value="", field_type="null", nullable=True)) return IRRecord(field_name=field_name, cobol=None, java=JavaIRField(raw_value="", decoded_value="", field_type="null", nullable=True)) def _ebcdic_to_ascii(self, raw: bytes) -> str: result = [] for b in raw: result.append(EBCDIC_TO_ASCII.get(b, chr(b) if 32 <= b < 127 else '?')) return ''.join(result)