Semantic AI for Future Industries: Bridging Explainability and Integration in Black Box Models

(Code and results of experiments related to the article submitted to ISM-2025: “International Conference on Industry of the Future and Smart Manufacturing”)

ABSTRACT

Artificial intelligence is increasingly used in industrial systems, yet the widespread adoption of black box models such as deep neural networks (NNs) presents challenges in transparency and interoperability. This paper introduces a novel Neuro-Symbolic eXplanation (NSX) pipeline that transforms black box analytics into explainable and integration-enabled semantic representations using SWRL rules and reasoning. Our approach consists of several key steps: generating synthetic data; training decision trees to approximate the behavior of NNs; and converting the decision trees into SWRL rules, which enables automated and explainable ontology-based reasoning. This transformation enhances both explainability, by making model logic explicit, and integration, by providing a semantic framework for cross-system interoperability. To further enhance usability, we integrate ChatGPT as an external automated service via API for multiple tasks: mapping internal feature representations to human-readable ontology terms; generating natural language explanations for inferred rules; explaining classification outcomes based on reasoner-derived results; and translating SWRL rules into SPARQL queries for alternative reasoning. This hybrid approach is particularly valuable in industrial contexts such as predictive maintenance, quality control, and autonomous decision-making, where transparency and system integration are crucial. We experimentally demonstrate the NSX pipeline’s effectiveness and discuss its implications for future industries.

CODE AND EXPERIMENTS

Experiments with IRIS (most recent, verified, and included in the article)

# EXPERIMENTS WITH DECISION TREE DEPTH=3

import numpy as np

import pandas as pd

from sklearn.datasets import load_iris

from sklearn.model_selection import train_test_split

from sklearn.preprocessing import StandardScaler

from sklearn.neural_network import MLPClassifier

from sklearn.tree import DecisionTreeClassifier, export_text

import re

def load_and_process_data():
    """Load Iris, build the name-mapping tables, and return a standardized split.

    Returns:
        A 10-tuple ``(X_train, X_test, y_train, y_test, feature_mapping,
        class_mapping, n_features, scaler, X, y)``. The train/test matrices
        are standardized with a scaler fitted on the training split only;
        ``X`` and ``y`` are the full, unscaled dataset.
    """
    dataset = load_iris()
    features, targets = dataset.data, dataset.target

    # Decision-tree feature key -> (SWRL property name, original column name)
    feature_mapping = {
        f"f{idx}": (f"hasF{idx}", column)
        for idx, column in enumerate(dataset.feature_names)
    }

    # Decision-tree leaf label -> (SWRL class name, original class name)
    class_mapping = {
        f"class: {idx}": (f"Class_{idx}", species)
        for idx, species in enumerate(dataset.target_names)
    }

    # 80/20 split with a fixed seed
    X_train, X_test, y_train, y_test = train_test_split(
        features, targets, test_size=0.2, random_state=42
    )

    # Fit the scaler on the training split, then apply it to both splits
    scaler = StandardScaler().fit(X_train)
    X_train = scaler.transform(X_train)
    X_test = scaler.transform(X_test)

    return (
        X_train,
        X_test,
        y_train,
        y_test,
        feature_mapping,
        class_mapping,
        features.shape[1],
        scaler,
        features,
        targets,
    )

def train_models(X_train, X_test, y_train, y_test, X_shape, scaler, X_original, y_original,
                 num_synthetic_samples=None, max_depth=3, random_state=None):
    """Train the neural network, label synthetic samples with it, and fit a surrogate tree.

    Args:
        X_train, X_test: Feature matrices already transformed by ``scaler``.
        y_train, y_test: Class labels for the two splits.
        X_shape: Number of features.
        scaler: Fitted scaler used to convert between original and scaled units.
        X_original, y_original: Full unscaled dataset; the tree is scored on it.
        num_synthetic_samples: Synthetic samples to collect per class. When
            falsy, ``len(X_train) // n_classes`` is used.
        max_depth: Depth limit of the surrogate decision tree. Defaults to 3,
            the depth named in this experiment's heading and shown in its
            recorded output.
        random_state: Optional seed for the synthetic sampling. ``None`` keeps
            drawing from NumPy's global random state.

    Returns:
        ``(clf, mlp, X_synthetic, scaler)``; ``X_synthetic`` is in original
        (unscaled) units.

    Raises:
        RuntimeError: If the draw budget is exhausted before every class has
            reached its target count.
    """
    mlp = MLPClassifier(hidden_layer_sizes=(50,), max_iter=2000, random_state=42, alpha=0.01)
    mlp.fit(X_train, y_train)
    print(f'NN Test Accuracy: {mlp.score(X_test, y_test):.4f}')

    # ---------- Refined Stage 2: Generate Synthetic Samples ----------

    def generate_synthetic_samples(model, X_shape, scaler, num_samples_per_class):
        """Draw uniform samples and keep a balanced set labelled by ``model``."""
        n_classes = len(model.classes_)
        target_count = num_samples_per_class if num_samples_per_class else len(X_train) // n_classes

        # Per-feature min/max of the training data, converted back to original units
        lows = scaler.inverse_transform(X_train.min(axis=0).reshape(1, -1))[0]
        highs = scaler.inverse_transform(X_train.max(axis=0).reshape(1, -1))[0]

        rng = np.random if random_state is None else np.random.RandomState(random_state)

        synthetic_samples = []
        synthetic_labels = []
        class_counts = np.zeros(n_classes, dtype=int)

        batch_size = 512
        # Bound the rejection sampling so a class the NN never predicts cannot hang the run
        max_draws = max(100_000, 1_000 * n_classes * target_count)
        draws = 0

        while class_counts.min() < target_count:
            if draws >= max_draws:
                raise RuntimeError(
                    f"Could not collect {target_count} synthetic samples per class "
                    f"after {draws} draws; class counts so far: {class_counts.tolist()}"
                )
            batch = rng.uniform(lows, highs, size=(batch_size, X_shape))
            draws += batch_size

            # One batched NN call; the most probable class becomes the label
            predicted = np.argmax(model.predict_proba(scaler.transform(batch)), axis=1)

            for sample, class_index in zip(batch, predicted):
                # Keep a sample only while its class is still below the target
                if class_counts[class_index] < target_count:
                    synthetic_samples.append(sample)
                    synthetic_labels.append(model.classes_[class_index])
                    class_counts[class_index] += 1

        return np.array(synthetic_samples), np.array(synthetic_labels)

    X_synthetic, y_synthetic = generate_synthetic_samples(mlp, X_shape, scaler, num_synthetic_samples)

    print(f"Synthetic data class distribution: {np.unique(y_synthetic, return_counts=True)}")

    y_train_pred = mlp.predict(X_train)
    print(f"NN training data class distribution: {np.unique(y_train_pred, return_counts=True)}")

    # ---------- End of Refined Stage 2 ----------

    # The tree is trained in scaled units, on the NN-labelled synthetic data
    X_synthetic_scaled = scaler.transform(X_synthetic)
    clf = DecisionTreeClassifier(max_depth=max_depth, random_state=42)
    clf.fit(X_synthetic_scaled, y_synthetic)

    # Score the tree against the true labels of the full original dataset
    X_original_scaled = scaler.transform(X_original)
    dt_accuracy = clf.score(X_original_scaled, y_original)
    print(f"Decision Tree Accuracy on Original Iris Data: {dt_accuracy:.4f}")

    return clf, mlp, X_synthetic, scaler

def generate_swrl_rules(clf, feature_names, class_mapping, scaler):
    """Turn every root-to-leaf path of a fitted decision tree into a SWRL rule.

    Args:
        clf: Fitted tree exposing ``tree_`` with ``children_left``,
            ``children_right``, ``feature``, ``threshold`` and ``value``.
        feature_names: One name per feature; name ``"f0"`` becomes the
            property atom ``hasF0(?p, ?x1)``.
        class_mapping: Maps ``"class: <index>"`` to a tuple whose first item
            is the SWRL class name.
        scaler: Object whose ``inverse_transform`` converts a scaled row back
            to original units.

    Returns:
        A list of rule strings, one per leaf, of the form
        ``Unclassified(?p) ^ <sorted conditions> -> <Class>(?p)``. Thresholds
        are written in original units with two decimals.
    """
    tree = clf.tree_
    n_features = len(feature_names)
    rules = []

    def to_original_scale(feature_index, threshold):
        # Only the probed column is read back; the zeros are placeholders.
        # NOTE(review): assumes the scaler transforms each column independently.
        probe = np.zeros((1, n_features))
        probe[0][feature_index] = threshold
        return scaler.inverse_transform(probe)[0][feature_index]

    def recurse(node, conditions, bound_variables):
        left_child = tree.children_left[node]
        right_child = tree.children_right[node]

        if left_child == -1 and right_child == -1:
            predicted_class = np.argmax(tree.value[node])
            class_name = class_mapping[f"class: {predicted_class}"][0]
            # Joining the whole atom list avoids a dangling " ^ " for a single-leaf tree
            body = ["Unclassified(?p)"] + sorted(conditions)
            rules.append(" ^ ".join(body) + f' -> {class_name}(?p)')
            return

        feature_index = tree.feature[node]
        feature = feature_names[feature_index]
        var = f'?x{feature_index + 1}'

        path_conditions = list(conditions)
        path_variables = set(bound_variables)

        # Bind the feature value to its variable once per path
        if var not in path_variables:
            path_conditions.append(f'has{feature.capitalize().replace(" ", "")}(?p, {var})')
            path_variables.add(var)

        threshold = to_original_scale(feature_index, tree.threshold[node])
        left_condition = f'swrlb:lessThanOrEqual({var}, {threshold:.2f})'
        right_condition = f'swrlb:greaterThan({var}, {threshold:.2f})'

        recurse(left_child, path_conditions + [left_condition], path_variables)
        recurse(right_child, path_conditions + [right_condition], path_variables)

    recurse(0, [], set())
    return rules

# Numeric comparison atoms this optimizer understands: swrlb:<op>(?xN, <number>)
_SWRL_COMPARISON_RE = re.compile(
    r'swrlb:(?P<op>lessThanOrEqual|greaterThanOrEqual|lessThan|greaterThan)'
    r'\((?P<variable>\?x\d+), (?P<value>[+-]?\d+\.?\d*)\)'
)

# Upper-bound operators keep their smallest value, lower-bound operators their largest
_TIGHTEST_BOUND = {
    "lessThanOrEqual": min,
    "greaterThanOrEqual": max,
    "lessThan": min,
    "greaterThan": max,
}


def optimize_swrl_rule(rule):
    """Remove redundant numeric comparisons from a single SWRL rule.

    For each variable and each comparison operator, only the tightest bound is
    kept; when two bounds tie, the first one encountered wins. Atoms that are
    not recognised comparisons (property atoms, other built-ins) are kept
    unchanged. The body is rebuilt as ``Unclassified(?p)`` followed by the
    remaining atoms in sorted order.

    Args:
        rule: Rule text of the form ``<atom> ^ <atom> ... -> <head>``.

    Returns:
        The optimized rule, or ``rule`` unchanged when it does not contain
        exactly one ``->``.
    """
    parts = rule.split('->')
    if len(parts) != 2:
        return rule  # Not a "body -> head" rule; nothing to optimize.

    body = parts[0].strip()
    head = parts[1].strip()

    passthrough = []  # atoms kept verbatim
    bounds = {}       # (variable, operator) -> [(value, atom), ...]

    for atom in (piece.strip() for piece in body.split('^')):
        # "Unclassified(?p)" is re-added once below; empty pieces come from a dangling "^"
        if not atom or atom == "Unclassified(?p)":
            continue
        match = _SWRL_COMPARISON_RE.match(atom)
        if match is None:
            passthrough.append(atom)
            continue
        key = (match.group('variable'), match.group('op'))
        bounds.setdefault(key, []).append((float(match.group('value')), atom))

    # min()/max() return the first of equal candidates, so ties keep the earliest atom
    tightest = [
        _TIGHTEST_BOUND[op](candidates, key=lambda candidate: candidate[0])[1]
        for (_, op), candidates in bounds.items()
    ]

    atoms = ["Unclassified(?p)"] + sorted(passthrough + tightest)
    return " ^ ".join(atoms) + " -> " + head

def optimize_inter_swrl_rules(rules):
    """Drop rules that are logically subsumed by another rule with the same head.

    A rule is redundant when another rule with the same head accepts
    everything it accepts: the other rule's plain atoms are all present in
    this rule, and for every numeric bound the other rule places on a
    variable, this rule has a bound on that variable that is at least as
    tight. When two rules are equivalent, only the first one is kept. Rules
    without exactly one ``->`` are never removed.

    Args:
        rules: Rule strings of the form ``<atom> ^ <atom> ... -> <head>``.

    Returns:
        The surviving rules, in their original order.
    """
    comparison_re = re.compile(
        r'swrlb:(?P<op>lessThanOrEqual|greaterThanOrEqual|lessThan|greaterThan)'
        r'\((?P<variable>\?x\d+), (?P<value>[+-]?\d+\.?\d*)\)'
    )
    # Bounds are (value, rank) tuples so plain tuple comparison orders tightness:
    # at equal value a strict upper bound sorts lower, a strict lower bound higher.
    upper_rank = {"lessThan": 0, "lessThanOrEqual": 1}
    lower_rank = {"greaterThanOrEqual": 0, "greaterThan": 1}

    def parse(rule):
        """Return (head, plain_atoms, upper_bounds, lower_bounds), or None if malformed."""
        pieces = rule.split("->")
        if len(pieces) != 2:
            return None
        plain_atoms, upper, lower = set(), {}, {}
        for atom in (piece.strip() for piece in pieces[0].split("^")):
            # Every rule carries Unclassified(?p), so it cannot distinguish rules
            if not atom or atom == "Unclassified(?p)":
                continue
            match = comparison_re.fullmatch(atom)
            if match is None:
                # Anything else is opaque and must match verbatim
                plain_atoms.add(atom)
                continue
            var = match.group('variable')
            op = match.group('op')
            value = float(match.group('value'))
            if op in upper_rank:
                bound = (value, upper_rank[op])
                upper[var] = min(bound, upper.get(var, bound))
            else:
                bound = (value, lower_rank[op])
                lower[var] = max(bound, lower.get(var, bound))
        return pieces[1].strip(), plain_atoms, upper, lower

    def implies(specific, general):
        """True when every individual matching ``specific`` also matches ``general``."""
        _, atoms_s, upper_s, lower_s = specific
        _, atoms_g, upper_g, lower_g = general
        return (
            atoms_g <= atoms_s
            and all(var in upper_s and upper_s[var] <= bound for var, bound in upper_g.items())
            and all(var in lower_s and lower_s[var] >= bound for var, bound in lower_g.items())
        )

    parsed = [parse(rule) for rule in rules]

    optimized_rules = []
    for i, rule in enumerate(rules):
        current = parsed[i]
        is_redundant = current is not None and any(
            j != i
            and other is not None
            and other[0] == current[0]
            and implies(current, other)
            # Equivalent rules imply each other; keep only the earliest one
            and (j < i or not implies(other, current))
            for j, other in enumerate(parsed)
        )
        if not is_redundant:
            optimized_rules.append(rule)

    return optimized_rules

# Main execution: run the pipeline on Iris and print the result of each stage.

(X_train, X_test, y_train, y_test, feature_mapping, class_mapping,
 X_shape, scaler, X_original, y_original) = load_and_process_data()

clf, mlp, X_synthetic, scaler = train_models(
    X_train, X_test, y_train, y_test, X_shape, scaler, X_original, y_original,
    num_synthetic_samples=400,
)

# Generic f0..fN names, used for both the tree dump and the SWRL generator
tree_feature_names = [f"f{i}" for i in range(X_synthetic.shape[1])]

# Decision tree as text
print('\nExtracted Decision Tree Rules:\n')
print(export_text(clf, feature_names=tree_feature_names))

# Name mappings between the tree, the SWRL rules and the original dataset
for key, (swrl_name, actual_name) in feature_mapping.items():
    print(f"{key} (Decision tree); {swrl_name} (SWRL rules); {actual_name} (name of attribute in the original dataset);")

print('\n')

for key, (swrl_name, actual_name) in class_mapping.items():
    print(f"{key} (Decision tree); {swrl_name} (SWRL rules); {actual_name} (name of class in the original dataset);")

# Raw SWRL rules, one per tree leaf
swrl_rules = generate_swrl_rules(clf, tree_feature_names, class_mapping, scaler)

print('\nGenerated SWRL Rules:\n')
for rule in swrl_rules:
    print(rule)

# First pass: tighten the bounds inside each rule
optimized_rules = [optimize_swrl_rule(rule) for rule in swrl_rules]

print('\nOptimized SWRL Rules (Intra-Rule Redundancy Removed):\n')
for rule in optimized_rules:
    print(rule)

# Second pass: remove rules made redundant by other rules
optimized_rules = optimize_inter_swrl_rules(optimized_rules)

print('\nOptimized SWRL Rules (Inter-Rule Redundancy Removed):\n')
for rule in optimized_rules:
    print(rule)

NN Test Accuracy: 1.0000

Synthetic data class distribution: (array([0, 1, 2]), array([400, 400, 400]))

NN training data class distribution: (array([0, 1, 2]), array([40, 39, 41]))

Decision Tree Accuracy on Original Iris Data: 0.9000

Extracted Decision Tree

with normalized attributes:

|--- f3 <= 0.70

| |--- f0 <= 0.40

| | |--- f1 <= 0.04

| | | |--- class: 1

| | |--- f1 > 0.04

| | | |--- class: 0

| |--- f0 > 0.40

| | |--- f1 <= 1.84

| | | |--- class: 1

| | |--- f1 > 1.84

| | | |--- class: 1

|--- f3 > 0.70

| |--- f2 <= 0.15

| | |--- f1 <= 0.27

| | | |--- class: 2

| | |--- f1 > 0.27

| | | |--- class: 0

| |--- f2 > 0.15

| | |--- f1 <= 1.65

| | | |--- class: 2

| | |--- f1 > 1.65

| | | |--- class: 2

Name Mappings:

f0 (Decision tree); hasF0 (SWRL rules); sepal length (cm) (name of attribute in the original dataset);

f1 (Decision tree); hasF1 (SWRL rules); sepal width (cm) (name of attribute in the original dataset);

f2 (Decision tree); hasF2 (SWRL rules); petal length (cm) (name of attribute in the original dataset);

f3 (Decision tree); hasF3 (SWRL rules); petal width (cm) (name of attribute in the original dataset);

class: 0 (Decision tree); Class_0 (SWRL rules); setosa (name of class in the original dataset);

class: 1 (Decision tree); Class_1 (SWRL rules); versicolor (name of class in the original dataset);

class: 2 (Decision tree); Class_2 (SWRL rules); virginica (name of class in the original dataset);

Generated SWRL Rules:

Unclassified(?p) ^ hasF0(?p, ?x1) ^ hasF1(?p, ?x2) ^ hasF3(?p, ?x4) ^ swrlb:lessThanOrEqual(?x1, 6.14) ^ swrlb:lessThanOrEqual(?x2, 3.08) ^ swrlb:lessThanOrEqual(?x4, 1.70) -> Class_1(?p)

Unclassified(?p) ^ hasF0(?p, ?x1) ^ hasF1(?p, ?x2) ^ hasF3(?p, ?x4) ^ swrlb:greaterThan(?x2, 3.08) ^ swrlb:lessThanOrEqual(?x1, 6.14) ^ swrlb:lessThanOrEqual(?x4, 1.70) -> Class_0(?p)

Unclassified(?p) ^ hasF0(?p, ?x1) ^ hasF1(?p, ?x2) ^ hasF3(?p, ?x4) ^ swrlb:greaterThan(?x1, 6.14) ^ swrlb:lessThanOrEqual(?x2, 3.89) ^ swrlb:lessThanOrEqual(?x4, 1.70) -> Class_1(?p)

Unclassified(?p) ^ hasF0(?p, ?x1) ^ hasF1(?p, ?x2) ^ hasF3(?p, ?x4) ^ swrlb:greaterThan(?x1, 6.14) ^ swrlb:greaterThan(?x2, 3.89) ^ swrlb:lessThanOrEqual(?x4, 1.70) -> Class_1(?p)

Unclassified(?p) ^ hasF1(?p, ?x2) ^ hasF2(?p, ?x3) ^ hasF3(?p, ?x4) ^ swrlb:greaterThan(?x4, 1.70) ^ swrlb:lessThanOrEqual(?x2, 3.18) ^ swrlb:lessThanOrEqual(?x3, 4.00) -> Class_2(?p)

Unclassified(?p) ^ hasF1(?p, ?x2) ^ hasF2(?p, ?x3) ^ hasF3(?p, ?x4) ^ swrlb:greaterThan(?x2, 3.18) ^ swrlb:greaterThan(?x4, 1.70) ^ swrlb:lessThanOrEqual(?x3, 4.00) -> Class_0(?p)

Unclassified(?p) ^ hasF1(?p, ?x2) ^ hasF2(?p, ?x3) ^ hasF3(?p, ?x4) ^ swrlb:greaterThan(?x3, 4.00) ^ swrlb:greaterThan(?x4, 1.70) ^ swrlb:lessThanOrEqual(?x2, 3.80) -> Class_2(?p)

Unclassified(?p) ^ hasF1(?p, ?x2) ^ hasF2(?p, ?x3) ^ hasF3(?p, ?x4) ^ swrlb:greaterThan(?x2, 3.80) ^ swrlb:greaterThan(?x3, 4.00) ^ swrlb:greaterThan(?x4, 1.70) -> Class_2(?p)

Optimized SWRL Rules (Intra-Rule Redundancy Removed):