Files

90 lines
2.7 KiB
Python

from dataclasses import dataclass
EBCDIC_TO_ASCII = {
0xC1: 'A', 0xC2: 'B', 0xC3: 'C', 0xC4: 'D', 0xC5: 'E',
0xC6: 'F', 0xC7: 'G', 0xC8: 'H', 0xC9: 'I', 0xD1: 'J',
0xD2: 'K', 0xD3: 'L', 0xD4: 'M', 0xD5: 'N', 0xD6: 'O',
0xD7: 'P', 0xD8: 'Q', 0xD9: 'R', 0xE2: 'S', 0xE3: 'T',
0xE4: 'U', 0xE5: 'V', 0xE6: 'W', 0xE7: 'X', 0xE8: 'Y',
0xE9: 'Z', 0xF0: '0', 0xF1: '1', 0xF2: '2', 0xF3: '3',
0xF4: '4', 0xF5: '5', 0xF6: '6', 0xF7: '7', 0xF8: '8',
0xF9: '9', 0x40: ' ', 0x4B: '.', 0x6B: ',', 0x5A: '!',
}
@dataclass
class CobolIRField:
raw_hex: str
decoded_value: str
encoding: str
field_type: str
length: int
scale: int
signed: bool
@dataclass
class JavaIRField:
raw_value: str
decoded_value: str
field_type: str
nullable: bool
@dataclass
class IRRecord:
field_name: str
cobol: CobolIRField | None = None
java: JavaIRField | None = None
class Normalizer:
def normalize_encoding(self, raw: bytes, encoding: str) -> str:
if encoding == "EBCDIC":
return self._ebcdic_to_ascii(raw)
return raw.decode("ascii", errors="replace")
def normalize_comp3(self, raw: bytes) -> str:
if not raw:
return "0"
nibbles = []
for b in raw:
nibbles.append((b >> 4) & 0x0F)
nibbles.append(b & 0x0F)
sign = nibbles.pop()
value = 0
for n in nibbles:
value = value * 10 + n
if sign in (0x0D, 0x0B):
value = -value
return str(value)
def normalize_date(self, date_str: str) -> str:
s = date_str.strip()
if len(s) == 8 and s.isdigit():
return f"{s[0:4]}-{s[4:6]}-{s[6:8]}"
return s
def to_ir_record(self, field_name, raw_hex, decoded_value,
encoding, field_type, length=0, scale=0, signed=False) -> IRRecord:
return IRRecord(
field_name=field_name,
cobol=CobolIRField(
raw_hex=raw_hex, decoded_value=decoded_value,
encoding=encoding, field_type=field_type,
length=length, scale=scale, signed=signed))
def to_null_ir(self, field_name, side="java") -> IRRecord:
if side == "java":
return IRRecord(field_name=field_name,
cobol=None, java=JavaIRField(raw_value="", decoded_value="", field_type="null", nullable=True))
return IRRecord(field_name=field_name,
cobol=None, java=JavaIRField(raw_value="", decoded_value="", field_type="null", nullable=True))
def _ebcdic_to_ascii(self, raw: bytes) -> str:
result = []
for b in raw:
result.append(EBCDIC_TO_ASCII.get(b, chr(b) if 32 <= b < 127 else '?'))
return ''.join(result)